framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,16,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,16,balanced,0.048101335763931274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,16,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,16,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,16,balanced,0.05357866485913595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,16,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,16,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,16,balanced,0.05731200178464254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,16,balanced,0.05698133508364359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,16,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,16,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,16,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,16,balanced,0.06022400160630544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,16,balanced,0.061434666315714516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,16,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,16,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,16,balanced,0.06809600194295247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,16,balanced,0.08226133386294048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,16,balanced,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,128,power_law_1.2,0.02109439969062805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,16,balanced,0.1389226714769999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,128,power_law_1.2,0.02109439969062805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,16,balanced,0.20974934101104736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,128,power_law_1.2,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,16,balanced,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,128,power_law_1.2,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,16,balanced,0.3423573176066081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,128,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,16,balanced,0.5461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,128,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,128,power_law_1.2,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,16,balanced,0.6654133399327596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,128,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,128,power_law_1.2,0.027020800113677978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,128,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,16,balanced,1.1125760078430176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,128,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,128,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,128,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,16,balanced,1.4301600456237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,128,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,128,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,128,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,128,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,128,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,128,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,128,power_law_1.2,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,128,power_law_1.2,0.15523840188980104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,128,power_law_1.2,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,128,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,128,power_law_1.2,0.4712384223937988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,128,power_law_1.2,0.5670911788940429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,128,power_law_1.2,0.8511296272277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,16,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,16,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,16,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,16,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,16,balanced,0.2954240043958028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,16,balanced,0.4270079930623372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,16,balanced,0.41864534219106037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,16,balanced,0.4203519821166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,16,balanced,0.42137598991394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,16,balanced,0.4261546532313029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,16,balanced,0.43110398451487225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,16,balanced,0.4331253369649251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,16,balanced,0.4394666751225789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,16,balanced,0.4485119978586833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,16,balanced,0.45431466897328693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,16,balanced,0.46865065892537433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,16,balanced,0.49595733483632404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,16,balanced,0.5259946584701538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,16,balanced,0.5765120188395182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,16,balanced,0.6203733285268148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,16,balanced,0.7043413321177164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,16,balanced,0.8058880170186361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,16,balanced,1.0763946374257405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,16,balanced,1.3760852813720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,16,balanced,1.9095892906188965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,16,balanced,2.473301410675049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,2,power_law_1.2,0.8404864311218262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,2,power_law_1.2,1.1384832382202148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,2,power_law_1.2,1.336524772644043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,2,power_law_1.2,2.0924415588378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,2,power_law_1.2,2.0527103424072264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,2,power_law_1.2,2.0766719818115233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,2,power_law_1.2,2.1004287719726564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,2,power_law_1.2,2.532147216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,2,power_law_1.2,2.856550407409668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,2,power_law_1.2,3.0277631759643553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,2,power_law_1.2,2.59686393737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,2,power_law_1.2,2.997043228149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,2,power_law_1.2,3.0136320114135744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,2,power_law_1.2,3.6571136474609376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,2,power_law_1.2,3.829964828491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,2,power_law_1.2,4.483276748657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,2,power_law_1.2,5.063679885864258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,2,power_law_1.2,7.650918579101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,2,power_law_1.2,9.249177551269531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,2,power_law_1.2,9.954508972167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,2,power_law_1.2,12.443443298339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,2,power_law_1.2,14.94323272705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,128,power_law_1.2,1.2589056015014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,2,power_law_1.2,19.068313598632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,2,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,2,power_law_1.2,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,2,power_law_1.2,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,2,power_law_1.2,0.7041024208068848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,2,power_law_1.2,1.0358783721923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,2,power_law_1.2,1.45797119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,2,power_law_1.2,1.6013311386108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,2,power_law_1.2,2.1284799575805664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,2,power_law_1.2,2.1014528274536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,2,power_law_1.2,2.106163215637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,2,power_law_1.2,2.3191551208496093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,2,power_law_1.2,2.353766441345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,2,power_law_1.2,2.4008703231811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,2,power_law_1.2,2.3941120147705077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,2,power_law_1.2,2.5278335571289063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,2,power_law_1.2,2.6849279403686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,2,power_law_1.2,2.695782470703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,2,power_law_1.2,3.020800018310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,2,power_law_1.2,3.2284671783447267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,2,power_law_1.2,3.339468765258789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,2,power_law_1.2,3.5946495056152346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,2,power_law_1.2,4.2260478973388675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,2,power_law_1.2,4.733337783813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,2,power_law_1.2,5.71412467956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,2,power_law_1.2,7.160422515869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,2,power_law_1.2,9.082265472412109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,2,power_law_1.2,11.418828582763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,2,power_law_1.2,26.15233154296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,2,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,2,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,2,balanced,0.532309333483378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,2,balanced,1.0466773509979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,2,balanced,2.0387840270996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,2,balanced,4.062037467956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,2,balanced,4.077055931091309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,2,balanced,4.114432017008464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,2,balanced,4.1260372797648115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,2,balanced,4.134570757548015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,2,balanced,4.047189394632976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,2,balanced,4.072618802388509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,2,balanced,4.087807973225911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,2,balanced,4.12501335144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,2,balanced,4.157951990763347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,2,balanced,4.1854292551676435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,2,balanced,4.245674769083659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,2,balanced,4.365482648213704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,2,balanced,4.474874814351399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,2,balanced,4.685311953226726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,1,balanced,1.1233279705047607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,1,balanced,2.189823945363363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,2,balanced,4.941141446431478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,1,balanced,4.329301198323567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,2,balanced,5.484202702840169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,1,balanced,8.557909647623697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,2,balanced,5.864959716796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,2,power_law_1.2,27.63591613769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,2,balanced,6.476800282796224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,1,balanced,17.00334930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,2,balanced,7.476906458536784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,2,balanced,10.070186614990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,1,balanced,21.241514841715496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,2,balanced,12.442085266113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,1,balanced,21.271722157796223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,1,balanced,21.29899724324544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,1,balanced,21.330603281656902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,1,balanced,21.364725748697918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,2,balanced,0.2676053245862325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,2,balanced,0.45687464872996014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,2,balanced,0.9181866645812988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,2,balanced,0.8862720330556234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,2,balanced,0.8884906768798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,2,balanced,0.8939519723256429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,1,balanced,21.443753560384113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,2,balanced,0.8980480035146078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,2,balanced,0.9024853706359863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,2,balanced,0.9065706729888916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,2,balanced,0.9101653099060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,2,balanced,0.922111988067627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,2,balanced,0.92740265528361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,2,balanced,0.9413973490397135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,2,balanced,0.9966933727264404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,2,balanced,1.0296320120493572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,2,balanced,1.0455040136973064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,2,balanced,1.0678613185882568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,2,balanced,1.4895787239074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,2,balanced,1.577130635579427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,2,balanced,1.9070293108622234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,1,balanced,21.484542846679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,2,balanced,2.2574079831441245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,2,balanced,3.1819092432657876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,2,balanced,4.0352427164713545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,2,balanced,5.78985595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,1,balanced,21.600596110026043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,2,balanced,7.416831970214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,2,balanced,10.825215657552084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,1,balanced,21.687978108723957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,2,balanced,14.231722513834635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,1,balanced,21.843963623046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,1,balanced,22.759742736816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,1,balanced,22.93469746907552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,1,balanced,24.0894292195638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,2,power_law_1.2,37.673779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,1,balanced,23.915008544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,1,balanced,30.014617919921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,1,balanced,27.732991536458332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,1,balanced,31.02429962158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,1,balanced,29.736788431803387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,1,balanced,35.80825551350912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,4,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,4,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,4,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,4,balanced,0.06741333504517873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,4,balanced,0.24439465999603271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,4,balanced,0.24627200762430826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,4,balanced,0.24710400899251303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,4,balanced,0.24780799945195517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,4,balanced,0.24882133801778158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,4,balanced,0.24934399127960205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,4,balanced,0.24456000328063965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,4,balanced,0.2469546596209208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,4,balanced,0.24849067131678262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,4,balanced,0.2505386670430501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,4,balanced,0.2561653256416321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,4,balanced,0.2585386633872986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,4,balanced,0.2728959918022156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,4,balanced,0.28363200028737384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,4,balanced,0.289792001247406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,4,balanced,0.31214932600657147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,4,balanced,0.342682679494222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,4,balanced,0.40192000071207684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,4,balanced,0.4652373393376668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,4,balanced,0.6275413433710734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,4,balanced,0.8193706671396891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,4,balanced,1.2028586864471436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,4,balanced,1.6008532842000325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,1,balanced,40.003926595052086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,1,balanced,52.08012898763021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,1,balanced,67.77207438151042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,2,power_law_1.2,51.61574096679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,4,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,4,power_law_1.01,0.02598400115966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,4,power_law_1.01,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,4,power_law_1.01,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,4,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,4,power_law_1.01,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,4,power_law_1.01,0.21913599967956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,4,power_law_1.01,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,4,power_law_1.01,0.22364161014556885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,4,power_law_1.01,0.23224320411682128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,4,power_law_1.01,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,4,power_law_1.01,0.23797760009765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,4,power_law_1.01,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,4,power_law_1.01,0.23797760009765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,4,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,4,power_law_1.01,0.24145278930664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,4,power_law_1.01,0.25722880363464357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,4,power_law_1.01,0.25927679538726806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,4,power_law_1.01,0.2799616098403931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,4,power_law_1.01,0.30986239910125735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,4,power_law_1.01,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,4,power_law_1.01,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,4,power_law_1.01,0.5396480083465576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,4,power_law_1.01,0.8333312034606933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,4,power_law_1.01,1.0321920394897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,4,power_law_1.01,1.641062355041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,4,power_law_1.01,2.375654411315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,8,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,8,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,8,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,8,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,8,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,8,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,8,power_law_1.01,0.04196479916572571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,8,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,8,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,8,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,8,power_law_1.01,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,8,power_law_1.01,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,8,power_law_1.01,0.1183743953704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,8,power_law_1.01,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,8,power_law_1.01,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,8,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,8,power_law_1.01,0.40468478202819824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,8,power_law_1.01,0.5203968048095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,8,power_law_1.01,0.7665599822998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,8,power_law_1.01,1.1554816246032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,8,power_law_1.01,1.7520639419555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,8,power_law_1.01,2.1823488235473634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,4,power_law_1.2,0.042156800627708435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,4,power_law_1.2,0.17424639463424682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,4,power_law_1.2,0.18943359851837158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,4,power_law_1.2,0.30368640422821047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,4,power_law_1.2,0.4122623920440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,4,power_law_1.2,0.3389440059661865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,4,power_law_1.2,0.6076416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,4,power_law_1.2,0.5445631980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,4,power_law_1.2,0.57259521484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,4,power_law_1.2,0.5654528141021729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,4,power_law_1.2,0.6002687931060791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,4,power_law_1.2,0.5810175895690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,4,power_law_1.2,0.6410240173339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,4,power_law_1.2,0.6469632148742676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,4,power_law_1.2,0.6369279861450196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,4,power_law_1.2,0.6856704235076905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,4,power_law_1.2,0.6832128047943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,4,power_law_1.2,0.7411712169647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,4,power_law_1.2,0.7030784130096436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,4,power_law_1.2,0.8278016090393067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,4,power_law_1.2,0.9078783988952637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,4,power_law_1.2,1.072537612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,4,power_law_1.2,1.3479743957519532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,4,power_law_1.2,1.7289215087890626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,4,power_law_1.2,2.0604927062988283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,4,power_law_1.2,3.1246335983276365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,4,power_law_1.2,3.6911102294921876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,8,power_law_1.01,0.15237120389938355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,8,power_law_1.01,0.09113600254058837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,8,power_law_1.01,0.18472959995269775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,8,power_law_1.01,0.20930559635162355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,8,power_law_1.01,0.2367487907409668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,8,power_law_1.01,0.23347198963165283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,8,power_law_1.01,0.23470079898834229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,8,power_law_1.01,0.23571200370788575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,8,power_law_1.01,0.232857608795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,8,power_law_1.01,0.24453120231628417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,8,power_law_1.01,0.2486272096633911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,8,power_law_1.01,0.2545664072036743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,8,power_law_1.01,0.27013120651245115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,8,power_law_1.01,0.2574336051940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,8,power_law_1.01,0.2705343961715698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,8,power_law_1.01,0.2748415946960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,8,power_law_1.01,0.2899967908859253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,8,power_law_1.01,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,8,power_law_1.01,0.30842878818511965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,8,power_law_1.01,0.35715839862823484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,8,power_law_1.01,0.42598400115966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,8,power_law_1.01,0.5189631938934326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,8,power_law_1.01,0.7776256084442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,8,power_law_1.01,1.0043392181396484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,8,power_law_1.01,1.386905574798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,8,power_law_1.01,2.188492774963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,8,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,8,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,8,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,8,balanced,0.279039998849233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,8,balanced,0.5302613178888956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,8,balanced,1.039189338684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,8,balanced,1.53548796971639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,8,balanced,1.5378774007161458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,8,balanced,1.5400959650675456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,8,balanced,1.543168067932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,8,balanced,1.5542613665262859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,8,balanced,1.5593546231587727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,8,balanced,1.5650134086608887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,8,balanced,1.57149871190389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,8,balanced,1.583957354227702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,8,balanced,1.5912960370381672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,8,balanced,1.614506721496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,8,balanced,1.6561493873596191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,8,balanced,1.7203200658162434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,8,balanced,1.7995093663533528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,8,balanced,1.87391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,8,balanced,2.0358826319376626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,8,balanced,2.2623573939005532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,8,balanced,2.528085390726725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,8,balanced,2.868053436279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,8,balanced,3.626666704813639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,8,balanced,4.495018641153972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,8,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,8,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,8,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,8,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,8,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,8,power_law_1.01,0.027020800113677978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,8,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,8,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,8,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,8,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,8,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,8,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,8,power_law_1.01,0.03478400111198425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,8,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,8,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,8,power_law_1.2,0.5189568042755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,8,power_law_1.2,0.5189631938934326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,8,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,8,power_law_1.2,0.5195775985717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,8,power_law_1.2,0.521011209487915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,8,power_law_1.2,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,8,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,8,power_law_1.2,0.6752255916595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,8,power_law_1.01,0.08417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,8,power_law_1.2,0.7491583824157715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,8,power_law_1.01,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,8,power_law_1.2,0.9539584159851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,8,power_law_1.2,1.0387455940246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,8,power_law_1.01,0.12738560438156127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,8,power_law_1.2,0.9070591926574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,8,power_law_1.2,1.2496895790100098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,8,power_law_1.2,1.2128255844116211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,8,power_law_1.2,1.7944448471069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,8,power_law_1.01,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,8,power_law_1.2,2.2659072875976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,8,power_law_1.2,2.3771135330200197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,8,power_law_1.2,3.0664703369140627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,8,power_law_1.01,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,8,power_law_1.2,4.158246231079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,8,power_law_1.2,5.33831672668457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,8,power_law_1.2,7.0883331298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,8,power_law_1.01,0.42885122299194334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,8,power_law_1.2,8.41891860961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,8,power_law_1.2,10.99120635986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,8,power_law_1.01,0.6209536075592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,2,power_law_1.2,1.1290623664855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,2,power_law_1.2,2.016870307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,2,power_law_1.2,2.980659294128418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,2,power_law_1.2,4.780851364135742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,2,power_law_1.2,6.687948608398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,2,power_law_1.2,8.681267547607423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,2,power_law_1.2,12.203826904296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,8,power_law_1.2,13.597491455078124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,2,power_law_1.2,12.678553771972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,2,power_law_1.2,12.880889892578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,2,power_law_1.2,12.701081848144531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,2,power_law_1.2,13.504716491699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,2,power_law_1.2,13.94913330078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,8,power_law_1.01,0.8157183647155761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,8,power_law_1.2,16.83599395751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,2,power_law_1.2,14.185881042480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,2,power_law_1.2,14.935244750976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,2,power_law_1.2,14.671257019042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,2,power_law_1.2,16.036863708496092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,4,balanced,0.4452693462371826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,4,balanced,0.8029867013295492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,4,balanced,1.567914644877116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,4,balanced,3.133082707722982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,4,balanced,5.925034840901692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,2,power_law_1.2,16.559922790527345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,8,power_law_1.01,1.2744704246520997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,4,balanced,8.290304183959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,4,balanced,8.319146474202475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,4,balanced,8.145919799804688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,2,power_law_1.2,16.810394287109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,4,balanced,8.163839975992838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,4,balanced,8.180394490559896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,2,power_law_1.2,17.33632049560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,4,balanced,8.20582389831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,4,balanced,8.236197153727213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,4,balanced,8.255658467610678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,2,power_law_1.2,19.048243713378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,4,balanced,8.301738739013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,4,balanced,8.346965154012045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,8,power_law_1.2,20.516659545898438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,4,balanced,8.390314737955729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,2,power_law_1.2,19.85761260986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,4,balanced,8.470698674519857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,4,balanced,9.406122843424479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,8,power_law_1.01,0.2717695951461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,4,balanced,8.941738764444986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,8,power_law_1.01,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,8,power_law_1.01,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,8,power_law_1.01,0.27381761074066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,8,power_law_1.01,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,8,power_law_1.01,0.27873280048370364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,2,power_law_1.2,21.685043334960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,8,power_law_1.01,0.31928319931030275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,8,power_law_1.01,0.32665600776672366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,8,power_law_1.01,0.34406399726867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,4,balanced,10.003114700317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,8,power_law_1.01,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,8,power_law_1.01,0.5095424175262451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,8,power_law_1.01,0.6549503803253174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,8,power_law_1.01,0.7493631839752197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,8,power_law_1.01,0.6281216144561768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,4,balanced,8.892074584960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,8,power_law_1.01,1.8696191787719727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,8,power_law_1.01,0.7241727828979492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,8,power_law_1.01,0.775167989730835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,8,power_law_1.01,0.873472023010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,4,balanced,9.45083745320638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,8,power_law_1.01,1.1345919609069823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,2,power_law_1.2,27.027252197265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,8,power_law_1.01,1.3367296218872071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,4,balanced,9.941845575968424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,4,balanced,11.32748794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,8,power_law_1.01,1.9290111541748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,8,power_law_1.01,2.087936019897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,4,balanced,12.344319661458334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,2,power_law_1.2,34.31403503417969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,4,balanced,16.245248158772785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,4,balanced,19.702442169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,2,power_law_1.2,31.934463500976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,8,power_law_1.01,3.4764801025390626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,8,power_law_1.2,26.6287109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,2,power_law_1.2,43.15709533691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,8,power_law_1.01,4.389888000488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,2,power_law_1.2,49.456536865234376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,8,power_law_1.01,5.722931289672852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,8,power_law_1.01,7.307878112792968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,8,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,8,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,8,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,8,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,8,balanced,0.08719999591509502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,8,balanced,0.202239990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,8,balanced,0.2039466698964437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,8,balanced,0.20548266172409058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,8,balanced,0.20565332969029745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,8,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,8,balanced,0.20974934101104736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,8,balanced,0.2129653294881185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,8,balanced,0.2155359983444214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,8,balanced,0.22066134214401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,8,balanced,0.22732800245285034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,8,balanced,0.2310826579729716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,8,balanced,0.24422399202982584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,8,balanced,0.26450665791829425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,8,balanced,0.2887413303057353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,8,balanced,0.34833065668741864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,8,balanced,0.37990399201711017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,8,balanced,0.4877653519312541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,8,balanced,0.6063786745071411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,8,balanced,0.9671680132548014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,8,balanced,1.2769280274709065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,8,balanced,1.8995200792948406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,8,balanced,2.4635732968648276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,8,power_law_1.01,10.609254455566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,8,power_law_1.2,34.08506774902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,8,power_law_1.01,13.644184875488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,4,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,4,power_law_1.01,0.05139200091361999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,4,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,4,power_law_1.01,0.12451839447021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,4,power_law_1.01,0.2197376012802124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,4,power_law_1.01,0.2519040107727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,4,power_law_1.01,0.28733439445495607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,4,power_law_1.01,0.2678783893585205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,4,power_law_1.01,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,4,power_law_1.01,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,4,power_law_1.01,0.30556159019470214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,4,power_law_1.01,0.33729920387268064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,4,power_law_1.01,0.318668794631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,4,power_law_1.01,0.33771519660949706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,4,power_law_1.01,0.38359038829803466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,4,power_law_1.01,0.3483648061752319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,4,power_law_1.01,0.37109758853912356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,4,power_law_1.01,0.416153621673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,4,power_law_1.01,0.42045440673828127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,4,power_law_1.01,0.4655104160308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,4,power_law_1.01,0.5124095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,4,power_law_1.01,0.6510591983795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,4,power_law_1.01,0.7407616138458252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,4,power_law_1.01,1.1040767669677733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,4,power_law_1.01,1.3023232460021972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,4,power_law_1.01,1.9499008178710937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,4,power_law_1.01,2.664633560180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,4,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,4,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,4,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,4,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,4,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,4,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,4,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,4,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,4,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,4,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,4,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,4,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,4,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,4,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,4,power_law_1.2,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,4,power_law_1.2,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,4,power_law_1.2,0.10914560556411743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,4,power_law_1.2,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,4,power_law_1.2,0.20971519947052003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,4,power_law_1.2,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,4,power_law_1.2,0.38236160278320314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,4,power_law_1.2,0.5746687889099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,4,power_law_1.2,0.8480768203735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,4,power_law_1.2,1.3797375679016113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,4,power_law_1.2,1.755955123901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,128,power_law_1.01,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,128,power_law_1.01,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,128,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,128,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,128,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,128,power_law_1.01,0.022924800217151643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,128,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,128,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,128,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,128,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,128,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,128,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,128,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,128,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,128,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,128,power_law_1.01,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,128,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,128,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,128,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,128,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,128,power_law_1.01,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,128,power_law_1.01,0.14417920112609864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,128,power_law_1.01,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,128,power_law_1.01,0.255180811882019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,128,power_law_1.01,0.33177599906921384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,128,power_law_1.01,0.5703680038452148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,128,power_law_1.01,0.7464960098266602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,128,power_law_1.2,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,128,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,128,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,128,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,128,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,128,power_law_1.2,0.05422719717025757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,128,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,128,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,128,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,128,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,128,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,128,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,128,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,128,power_law_1.2,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,128,power_law_1.2,0.10076160430908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,4,power_law_1.2,2.5600000381469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,128,power_law_1.2,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,128,power_law_1.2,0.14335999488830567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,128,power_law_1.2,0.20559999942779542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,128,power_law_1.2,0.2420736074447632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,128,power_law_1.2,0.3047424077987671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,128,power_law_1.2,0.4384768009185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,128,power_law_1.2,0.6514688014984131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,128,power_law_1.2,0.7473023891448974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,128,power_law_1.2,1.2109760284423827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,128,power_law_1.2,1.6891904830932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,128,power_law_1.2,2.487295913696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,128,power_law_1.2,3.3882110595703123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,64,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,64,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,64,power_law_1.01,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,64,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,64,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,64,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,64,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,64,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,64,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,64,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,64,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,64,power_law_1.01,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,64,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,64,power_law_1.01,0.0685696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,64,power_law_1.01,0.0802623987197876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,64,power_law_1.01,0.07820799946784973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,64,power_law_1.01,0.1013759970664978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,64,power_law_1.01,0.14313600063323975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,64,power_law_1.01,0.1955839991569519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,64,power_law_1.01,0.2367232084274292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,64,power_law_1.01,0.28733439445495607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,2,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,2,balanced,0.029343999922275543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,2,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,2,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,2,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,2,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,2,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,64,power_law_1.01,0.3739327907562256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,2,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,2,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,2,balanced,0.049653331438700356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,2,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,2,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,2,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,2,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,2,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,2,balanced,0.0988159974416097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,2,balanced,0.15308800339698792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,2,balanced,0.20923733711242676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,2,balanced,0.24883200724919638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,2,balanced,0.3109546701113383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,2,balanced,0.3829760154088338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,64,power_law_1.01,0.4462592124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,2,balanced,0.59443199634552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,2,balanced,0.7995733420054117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,64,power_law_1.01,0.7470975875854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,2,balanced,1.2922879854838054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,2,balanced,1.746773401896159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,64,power_law_1.01,0.8976384162902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,2,balanced,2.7267414728800454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,64,power_law_1.01,1.700454330444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,2,balanced,3.727871894836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,64,power_law_1.01,2.084454345703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,4,power_law_1.2,3.5559104919433593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,2,power_law_1.2,0.32561280727386477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,2,power_law_1.2,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,2,power_law_1.2,0.8996864318847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,2,power_law_1.2,1.4323391914367676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,2,power_law_1.2,1.8911231994628905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,2,power_law_1.2,2.626560020446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,2,power_law_1.2,3.3290241241455076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,2,power_law_1.2,4.294041442871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,2,power_law_1.2,4.374732971191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,2,power_law_1.2,4.562329483032227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,2,power_law_1.2,4.688486480712891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,2,power_law_1.2,4.926464080810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,2,power_law_1.2,4.699135971069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,2,power_law_1.2,4.803788757324218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,2,power_law_1.2,5.065932846069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,2,power_law_1.2,4.857408142089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,2,power_law_1.2,5.42289924621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,2,power_law_1.2,5.474303817749023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,2,power_law_1.2,5.884723281860351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,2,power_law_1.2,6.207078552246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,2,power_law_1.2,6.7688446044921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,2,power_law_1.2,7.176582336425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,2,power_law_1.2,8.339250946044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,2,power_law_1.2,9.822003173828126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,2,power_law_1.2,11.510784149169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,2,power_law_1.2,14.98787841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,2,power_law_1.2,17.22081298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,2,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,2,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,2,balanced,0.16759467124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,2,balanced,0.3553280035654704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,2,balanced,0.672426700592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,2,balanced,1.3064533074696858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,2,balanced,1.3122560183207195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,2,balanced,1.3204480012257893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,2,balanced,1.3262506326039631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,2,balanced,1.3294933636983235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,2,balanced,1.3340959548950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,2,balanced,1.3436586062113445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,2,balanced,1.3527040481567383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,2,balanced,1.3658453623453777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,2,balanced,1.3805173238118489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,2,balanced,1.3928106625874836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,2,balanced,1.4149972597757976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,2,balanced,1.4679039319356282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,2,balanced,1.5201279322306316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,2,balanced,1.6349867184956868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,2,balanced,1.72270933787028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,2,balanced,1.8930346171061199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,2,balanced,2.0962986946105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,2,balanced,2.5053866704305015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,2,balanced,2.899285316467285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,2,balanced,3.7886292139689126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,2,balanced,4.913322766621907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,1,balanced,0.5889706611633301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,1,balanced,1.0335573355356853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,1,balanced,2.033141295115153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,1,balanced,4.111530621846517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,1,balanced,7.957333246866862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,1,balanced,15.859882354736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,1,balanced,15.892468770345053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,1,balanced,15.912277221679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,1,balanced,15.949483235677084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,1,balanced,15.967231750488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,1,balanced,16.02577082316081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,1,balanced,16.06604766845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,1,balanced,16.109909057617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,1,balanced,16.19421895345052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,1,balanced,16.289620717366535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,1,balanced,16.355499267578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,1,balanced,16.501759847005207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,1,balanced,17.327274322509766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,32,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,32,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,32,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,32,power_law_1.2,0.02927359938621521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,32,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,32,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,32,power_law_1.2,0.03214719891548157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,32,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,32,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,32,power_law_1.2,0.03971840143203735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,32,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,32,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,32,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,1,balanced,17.72219721476237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,32,power_law_1.2,0.06266239881515503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,32,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,32,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,32,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,32,power_law_1.2,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,32,power_law_1.2,0.1087488055229187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,32,power_law_1.2,0.1525760054588318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,32,power_law_1.2,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,32,power_law_1.2,0.3446784019470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,1,balanced,18.280277252197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,32,power_law_1.2,0.39034879207611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,1,balanced,21.14303970336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,32,power_law_1.2,0.744652795791626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,1,balanced,29.847381591796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,1,balanced,23.148033142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,32,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,32,power_law_1.2,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,32,power_law_1.2,0.22814719676971434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,1,balanced,22.61230977376302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,32,power_law_1.2,0.13066240549087524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,32,power_law_1.2,0.1679360032081604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,32,power_law_1.2,0.2297663927078247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,32,power_law_1.2,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,32,power_law_1.2,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,32,power_law_1.2,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,32,power_law_1.2,0.24860799312591553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,32,power_law_1.2,0.25436160564422605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,32,power_law_1.2,0.25496320724487304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,32,power_law_1.2,0.25804800987243653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,32,power_law_1.2,0.25229439735412595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,32,power_law_1.2,0.9621503829956055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,32,power_law_1.2,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,32,power_law_1.2,0.27648000717163085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,32,power_law_1.2,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,32,power_law_1.2,0.3135488033294678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,32,power_law_1.2,0.43479042053222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,32,power_law_1.2,0.5777408123016358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,32,power_law_1.2,0.6203392028808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,32,power_law_1.2,0.8364031791687012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,1,balanced,30.868138631184895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,32,power_law_1.2,1.1266048431396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,1,balanced,0.07901866734027863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,1,balanced,0.28142933050791424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,1,balanced,0.535370667775472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,1,balanced,1.039189338684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,1,balanced,2.037077267964681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,1,balanced,30.950398763020832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,1,balanced,4.037290573120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,1,balanced,6.022144317626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,1,balanced,6.031701405843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,32,power_law_1.2,1.8886655807495116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,1,balanced,6.052346547444661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,32,power_law_1.2,1.600921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,1,balanced,6.0706132253011065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,1,balanced,6.10321044921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,1,balanced,6.129834493001302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,1,balanced,39.01730092366537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,1,balanced,6.160725275675456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,1,balanced,6.232400258382161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,1,balanced,6.292133331298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,1,balanced,6.333610534667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,1,balanced,6.4368642171223955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,1,balanced,6.658901214599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,1,balanced,7.0060373942057295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,1,balanced,7.403167724609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,1,balanced,7.822506586710612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,1,balanced,8.770037333170572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,1,balanced,9.599487940470377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,1,balanced,11.676500956217447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,1,balanced,13.61355209350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,32,power_law_1.2,2.974105644226074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,1,balanced,17.806507110595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,1,balanced,21.380777994791668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,32,power_law_1.2,3.379404830932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,32,power_law_1.2,2.2937599182128907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,4,power_law_1.01,0.5910336017608643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,4,power_law_1.01,1.0430463790893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,4,power_law_1.01,1.1390975952148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,4,power_law_1.01,1.5880191802978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,4,power_law_1.01,1.6465791702270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,4,power_law_1.01,2.352511978149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,4,power_law_1.01,2.3431167602539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,4,power_law_1.01,2.537651252746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,4,power_law_1.01,2.43240966796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,4,power_law_1.01,2.6091455459594726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,4,power_law_1.01,2.5620479583740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,4,power_law_1.01,2.587238311767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,4,power_law_1.01,2.594611167907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,4,power_law_1.01,2.720358467102051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,4,power_law_1.01,2.920038414001465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,4,power_law_1.01,2.8368896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,4,power_law_1.01,2.931884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,4,power_law_1.01,3.114803123474121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,4,power_law_1.01,3.2866302490234376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,4,power_law_1.01,3.4136062622070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,4,power_law_1.01,3.7910526275634764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,4,power_law_1.01,4.564787292480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,4,power_law_1.01,4.8658302307128904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,4,power_law_1.01,6.282444763183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,32,power_law_1.2,4.7355903625488285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,4,power_law_1.01,7.938457489013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,4,power_law_1.01,12.792588806152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,4,power_law_1.01,13.780551147460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,64,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,64,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,64,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,64,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,64,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,64,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,64,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,64,power_law_1.01,0.05609599947929382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,64,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,64,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,64,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,64,power_law_1.01,0.061401599645614625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,64,power_law_1.01,0.062041598558425906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,64,power_law_1.01,0.08414720296859741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,64,power_law_1.01,0.0997376024723053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,64,power_law_1.01,0.132096004486084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,64,power_law_1.01,0.16650240421295165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,64,power_law_1.01,0.20111360549926757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,64,power_law_1.01,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,64,power_law_1.01,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,64,power_law_1.01,0.33648641109466554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,64,power_law_1.01,0.4544511795043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,64,power_law_1.01,0.6096896171569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,64,power_law_1.01,0.9052160263061524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,64,power_law_1.01,1.299251174926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,64,power_law_1.01,2.0305919647216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,64,power_law_1.01,2.568806457519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,64,power_law_1.2,0.3147775888442993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,64,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,64,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,64,power_law_1.2,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,64,power_law_1.2,0.1802240014076233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,64,power_law_1.2,0.17408000230789183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,64,power_law_1.2,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,64,power_law_1.2,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,64,power_law_1.2,0.2582528114318848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,64,power_law_1.2,0.25128960609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,64,power_law_1.2,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,64,power_law_1.2,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,64,power_law_1.2,0.2875391960144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,64,power_law_1.2,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,64,power_law_1.2,0.3127295970916748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,64,power_law_1.2,0.3000319957733154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,64,power_law_1.2,0.3452928066253662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,64,power_law_1.2,0.35880959033966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,64,power_law_1.2,0.4296703815460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,64,power_law_1.2,0.5244927883148194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,64,power_law_1.2,0.582860803604126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,64,power_law_1.2,0.8667136192321777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,64,power_law_1.2,1.1485183715820313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,64,power_law_1.2,2.0717567443847655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,64,power_law_1.2,2.2368255615234376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,64,power_law_1.2,3.355238342285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,64,power_law_1.2,4.754630279541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,1,balanced,0.33536001046498615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,1,balanced,0.5693440039952596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,1,balanced,1.1031893094380696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,1,balanced,2.164906660715739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,1,balanced,4.301994641621907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,1,balanced,5.327871958414714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,1,balanced,5.351935704549153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,1,balanced,5.369514465332031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,1,balanced,5.39134407043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,1,balanced,5.406874974568685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,1,balanced,5.445802688598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,1,balanced,5.480106353759766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,1,balanced,5.507925033569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,1,balanced,5.561855951944987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,1,balanced,5.616810480753581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,1,balanced,5.6685225168863935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,1,balanced,5.766656239827474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,1,balanced,5.966677347819011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,1,balanced,6.148096084594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,1,balanced,6.81881586710612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,1,balanced,6.857727686564128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,1,balanced,7.482197443644206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,1,balanced,8.175615946451822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,1,balanced,9.845077514648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,1,balanced,12.338858286539713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,1,balanced,18.351786295572918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,1,balanced,23.34941864013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,32,power_law_1.01,0.5974016189575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,32,power_law_1.01,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,32,power_law_1.01,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,32,power_law_1.01,0.5447616100311279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,32,power_law_1.01,0.504422378540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,32,power_law_1.01,0.47329277992248536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,32,power_law_1.01,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,32,power_law_1.01,0.51179518699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,32,power_law_1.01,0.527564811706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,32,power_law_1.01,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,32,power_law_1.01,0.4941823959350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,32,power_law_1.01,0.5513152122497559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,32,power_law_1.01,0.5414912223815918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,32,power_law_1.01,0.5556223869323731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,32,power_law_1.01,0.5355519771575927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,32,power_law_1.01,0.5818367958068847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,32,power_law_1.01,0.5730303764343262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,32,power_law_1.01,0.587775993347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,32,power_law_1.01,0.6723584175109864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,32,power_law_1.01,0.71495680809021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,32,power_law_1.01,0.8472576141357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,32,power_law_1.01,1.0133503913879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,32,power_law_1.01,1.1579392433166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,32,power_law_1.01,1.8925567626953126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,32,power_law_1.01,2.305023956298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,32,power_law_1.01,2.8999679565429686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,32,power_law_1.01,4.437811279296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,8,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,8,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,8,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,8,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,8,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,8,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,8,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,8,power_law_1.2,0.03150720000267029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,8,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,8,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,8,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,8,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,8,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,8,power_law_1.2,0.042156800627708435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,8,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,8,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,8,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,8,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,8,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,8,power_law_1.2,0.16732159852981568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,8,power_law_1.2,0.28037118911743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,8,power_law_1.2,0.37355520725250246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,8,power_law_1.2,0.6706880092620849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,8,power_law_1.2,1.0463104248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,16,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,16,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,16,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,16,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,16,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,16,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,16,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,16,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,16,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,16,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,16,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,16,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,16,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,16,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,16,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,16,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,16,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,16,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,16,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,4,balanced,0.07234666744867961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,4,balanced,0.3051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,4,balanced,0.5905066728591919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,4,balanced,1.1161493460337322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,4,balanced,2.174773375193278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,16,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,4,balanced,2.77128537495931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,16,power_law_1.2,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,16,power_law_1.2,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,4,balanced,2.7789653142293296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,4,balanced,2.727253278096517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,16,power_law_1.2,0.20869119167327882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,4,balanced,2.731861432393392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,4,balanced,2.7386560440063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,4,balanced,2.745685259501139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,4,balanced,2.758634567260742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,4,balanced,2.7757228215535483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,8,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,16,power_law_1.2,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,8,power_law_1.01,0.16609280109405516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,4,balanced,2.798762639363607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,8,power_law_1.01,0.24531838893890381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,4,balanced,2.8235092163085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,8,power_law_1.01,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,8,power_law_1.01,0.26972160339355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,4,balanced,2.916693369547526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,8,power_law_1.01,0.30392320156097413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,8,power_law_1.01,0.31784958839416505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,4,balanced,2.9552586873372397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,8,power_law_1.01,0.318668794631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,4,balanced,3.0218238830566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,8,power_law_1.01,0.3147775888442993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,8,power_law_1.01,0.3053567886352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,4,balanced,3.079850514729818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,8,power_law_1.01,0.31293439865112305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,8,power_law_1.01,0.3151808023452759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,8,power_law_1.01,0.33607680797576905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,4,balanced,3.449343999226888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,8,power_law_1.01,0.34689280986785886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,8,power_law_1.01,0.3264512062072754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,4,balanced,3.238400141398112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,8,power_law_1.01,0.342630410194397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,8,power_law_1.01,0.37457919120788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,8,power_law_1.01,0.3737600088119507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,4,balanced,3.5225601196289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,8,power_law_1.01,0.3952640056610107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,8,power_law_1.01,0.4104191780090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,4,balanced,3.8251520792643228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,8,power_law_1.01,0.45155839920043944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,8,power_law_1.01,0.5410816192626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,8,power_law_1.01,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,4,balanced,4.5696001052856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,8,power_law_1.01,0.9752575874328613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,8,power_law_1.01,1.192307186126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,4,balanced,6.077269236246745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,8,power_law_1.01,1.7688575744628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,8,power_law_1.01,2.214092826843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,4,balanced,7.984469095865886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,8,power_law_1.2,1.642265510559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,4,balanced,10.203477223714193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,16,power_law_1.2,0.3848191976547241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,8,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,8,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,8,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,8,power_law_1.01,0.0530239999294281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,8,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,8,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,8,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,8,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,8,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,8,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,8,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,16,power_law_1.2,0.6053887844085694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,8,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,8,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,8,power_law_1.01,0.1052672028541565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,8,power_law_1.01,0.09502720236778259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,8,power_law_1.01,0.1320639967918396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,8,power_law_1.01,0.1550336003303528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,8,power_law_1.01,0.2355072021484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,8,power_law_1.01,0.26620800495147706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,8,power_law_1.01,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,8,power_law_1.01,0.39502720832824706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,8,power_law_1.01,0.5429247856140137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,8,power_law_1.01,0.7366655826568603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,8,power_law_1.01,1.1778047561645508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,8,power_law_1.01,1.7174528121948243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,8,power_law_1.01,2.630656051635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,8,power_law_1.01,3.323699188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,16,power_law_1.2,0.951910400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,8,power_law_1.2,2.3846912384033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,4,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,4,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,4,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,4,balanced,0.28296534220377606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,4,balanced,0.5329920053482056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,4,balanced,1.0262080033620198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,4,balanced,1.5139840443929036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,4,balanced,1.5187625885009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,4,balanced,1.5235412915547688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,4,balanced,1.5278080304463704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,4,balanced,1.5370240211486816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,4,balanced,1.5467519760131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,4,balanced,1.553749402364095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,4,balanced,1.5713280042012532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,4,balanced,1.5892480214436848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,4,balanced,1.60426664352417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,4,balanced,1.633962631225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,4,balanced,1.6911360422770183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,4,balanced,1.7495039304097493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,4,balanced,1.8471253712972004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,4,balanced,1.9585706392923992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,4,balanced,2.2010879516601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,4,balanced,2.4258559544881186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,4,balanced,2.9755732218424478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,4,balanced,3.4957653681437173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,4,balanced,4.638719876607259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,4,balanced,5.780821482340495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,2,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,2,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,2,power_law_1.2,0.2617343902587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,2,power_law_1.2,0.36186881065368653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,2,power_law_1.2,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,2,power_law_1.2,0.7018496036529541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,2,power_law_1.2,0.8488960266113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,2,power_law_1.2,1.012326431274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,2,power_law_1.2,1.025216007232666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,2,power_law_1.2,1.1339776039123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,2,power_law_1.2,1.1546624183654786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,2,power_law_1.2,1.2677120208740233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,2,power_law_1.2,1.2726143836975097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,2,power_law_1.2,1.3240320205688476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,2,power_law_1.2,1.3279232025146483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,2,power_law_1.2,1.3948927879333497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,2,power_law_1.2,1.4366720199584961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,2,power_law_1.2,1.618534469604492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,2,power_law_1.2,1.763532829284668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,2,power_law_1.2,1.9752960205078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,2,power_law_1.2,2.229452705383301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,2,power_law_1.2,2.7072511672973634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,2,power_law_1.2,3.1309823989868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,2,power_law_1.2,4.049100875854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,2,power_law_1.2,5.126348876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,2,power_law_1.2,6.845849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,2,power_law_1.2,9.235865783691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,128,power_law_1.01,0.03929600119590759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,128,power_law_1.01,0.03808639943599701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,128,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,128,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,128,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,128,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,128,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,128,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,128,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,128,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,128,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,128,power_law_1.01,0.044633600115776065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,128,power_law_1.01,0.04503040015697479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,128,power_law_1.01,0.04688000082969666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,128,power_law_1.01,0.04973439872264862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,128,power_law_1.01,0.05057280063629151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,128,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,128,power_law_1.01,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,128,power_law_1.01,0.09584640264511109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,128,power_law_1.01,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,128,power_law_1.01,0.14026880264282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,128,power_law_1.01,0.1968127965927124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,128,power_law_1.01,0.21544959545135497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,128,power_law_1.01,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,128,power_law_1.01,0.4353792190551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,128,power_law_1.01,0.7792640209197998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,16,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,16,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,16,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,128,power_law_1.01,1.127014446258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,16,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,16,power_law_1.2,0.05978879928588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,16,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,16,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,16,power_law_1.2,0.06307200193405152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,16,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,16,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,16,power_law_1.2,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,16,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,16,power_law_1.2,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,16,power_law_1.2,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,16,power_law_1.2,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,16,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,16,power_law_1.2,0.12940160036087037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,16,power_law_1.2,0.18921600580215453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,16,power_law_1.2,0.2076672077178955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,16,power_law_1.2,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,16,power_law_1.2,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,16,power_law_1.2,0.4587520122528076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,16,power_law_1.2,0.715334415435791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,16,power_law_1.2,1.1563008308410645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,16,power_law_1.2,1.567948818206787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,16,power_law_1.2,2.36810245513916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,16,power_law_1.2,2.9853696823120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,8,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,8,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,8,balanced,0.05681600173314413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,8,balanced,0.2943893273671468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,8,balanced,0.5379199981689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,8,balanced,1.032533327738444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,8,balanced,1.0374826590220134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,8,balanced,1.0397013028462727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,8,balanced,1.042944033940633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,8,balanced,1.0444800059000652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,8,balanced,1.0490880012512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,8,balanced,1.0803199609120686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,8,balanced,1.0625706513722737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,8,balanced,1.0711039702097576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,8,balanced,1.0849173069000244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,8,balanced,1.0941440264383953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,8,balanced,1.1136000156402588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,8,balanced,1.1520000298817952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,8,balanced,1.191765308380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,8,balanced,1.2625919977823894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,8,balanced,1.3428053855895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,8,balanced,1.4779733022054036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,8,balanced,1.6404479344685872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,8,balanced,1.9531092643737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,8,balanced,2.4065705935160318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,8,balanced,3.297621409098307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,8,balanced,4.18065071105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,32,power_law_1.2,0.4020224094390869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,32,power_law_1.2,0.37969920635223386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,32,power_law_1.2,0.3788800001144409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,32,power_law_1.2,0.33955841064453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,32,power_law_1.2,0.29859840869903564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,32,power_law_1.2,0.3547136068344116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,32,power_law_1.2,0.34283521175384524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,32,power_law_1.2,0.3448832035064697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,32,power_law_1.2,0.37416958808898926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,32,power_law_1.2,0.3616767883300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,32,power_law_1.2,0.3983360052108765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,32,power_law_1.2,0.39813120365142823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,32,power_law_1.2,0.4098048210144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,32,power_law_1.2,0.41021437644958497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,32,power_law_1.2,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,32,power_law_1.2,0.40468478202819824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,32,power_law_1.2,0.46694397926330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,32,power_law_1.2,0.5511168003082275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,32,power_law_1.2,0.5709824085235595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,32,power_law_1.2,0.7258111953735351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,32,power_law_1.2,0.908902359008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,32,power_law_1.2,1.4774271965026855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,32,power_law_1.2,1.6697343826293944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,32,power_law_1.2,2.4031232833862304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,32,power_law_1.2,3.4562049865722657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,8,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,8,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,8,balanced,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,8,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,8,balanced,0.02609066665172577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,8,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,8,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,8,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,8,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,8,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,8,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,8,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,8,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,8,balanced,0.03344533344109853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,8,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,8,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,8,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,8,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,8,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,8,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,8,balanced,0.06518933176994324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,8,balanced,0.07202133536338806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,8,balanced,0.10393599669138591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,8,balanced,0.16401066382726034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,8,balanced,0.26504000027974445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,8,balanced,0.35174401601155597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,8,balanced,0.5278720060984293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,8,balanced,0.23688532908757529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,8,balanced,0.2387626568476359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,8,balanced,0.23944532871246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,8,balanced,0.7026346524556478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,8,balanced,0.23995733261108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,8,balanced,0.24132267634073892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,8,balanced,0.24200000365575156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,8,balanced,0.244053324063619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,32,power_law_1.2,4.645068740844726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,8,balanced,0.24541866779327393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,8,balanced,0.24728000164031982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,8,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,8,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,8,balanced,0.2600959936777751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,8,balanced,0.26691200335820514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,8,balanced,0.28142400582631427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,8,balanced,0.29371732473373413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,8,balanced,0.30719999472300213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,8,balanced,0.34065067768096924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,8,balanced,0.43110398451487225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,8,balanced,0.46967466672261554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,8,balanced,0.7115093072255453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,8,balanced,0.9204053084055582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,8,balanced,1.4197759628295898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,8,balanced,1.82476806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,32,power_law_1.2,6.290220642089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,1,balanced,1.7698133786519368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,1,balanced,3.5012213389078775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,1,balanced,6.926165262858073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,1,balanced,6.96012814839681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,1,balanced,6.981119791666667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,1,balanced,6.959615707397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,1,balanced,6.974122365315755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,1,balanced,7.010133107503255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,1,balanced,7.250773111979167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,1,balanced,7.293952306111653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,1,balanced,7.347370783487956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,1,balanced,7.388330459594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,1,balanced,7.4246826171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,1,balanced,7.500458399454753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,1,balanced,12.003669738769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,1,balanced,12.199595133463541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,1,balanced,12.319061279296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,1,balanced,17.65171178181966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,1,balanced,21.53369649251302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,1,balanced,27.351552327473957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,1,balanced,32.69614919026693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,1,balanced,39.472981770833336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,1,balanced,45.170003255208336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,1,balanced,57.907368977864586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,1,balanced,71.13557434082031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.5341184139251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.7927807807922364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,1,power_law_1.01,1.0461183547973634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,1,power_law_1.01,1.4682111740112305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,1,power_law_1.01,1.533132839202881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,1,power_law_1.01,1.6189376831054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,1,power_law_1.01,1.660108757019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,1,power_law_1.01,1.7367040634155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,1,power_law_1.01,1.8550783157348634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,1,power_law_1.01,1.8872320175170898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,1,power_law_1.01,1.9705856323242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,1,power_law_1.01,2.0344831466674806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,1,power_law_1.01,2.1116928100585937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,1,power_law_1.01,2.2120447158813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,1,power_law_1.01,2.471718406677246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,1,power_law_1.01,2.7430912017822267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,1,balanced,95.68887329101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,1,power_law_1.01,3.1510528564453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,1,power_law_1.01,3.5723262786865235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,1,power_law_1.01,4.499660873413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,1,power_law_1.01,5.371903991699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,1,power_law_1.01,7.29333724975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,1,power_law_1.01,9.1146240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,4,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,4,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,4,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,4,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,4,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,4,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,4,power_law_1.01,0.027820798754692077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,4,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,4,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,4,power_law_1.01,0.030291199684143066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,4,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,4,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,4,power_law_1.01,0.039103999733924866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,1,power_law_1.01,13.021388244628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,4,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,4,power_law_1.01,0.05957760214805603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,4,power_law_1.01,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,4,power_law_1.01,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,4,power_law_1.01,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,1,power_law_1.01,16.924467468261717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,4,power_law_1.01,0.1478656053543091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,128,balanced,0.04914666712284088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,128,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,128,balanced,0.046394666035970054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,4,power_law_1.01,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,128,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,128,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,128,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,128,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,128,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,128,balanced,0.056320001681645714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,128,balanced,0.05649066468079885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,128,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,128,balanced,0.05989866455396017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,128,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,128,balanced,0.06465599934260051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,128,balanced,0.08226133386294048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,128,balanced,0.11895466844240825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,128,balanced,0.1713493267695109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,128,balanced,0.21435733636220297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,128,balanced,0.22835199038187662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,128,balanced,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,128,balanced,0.3126613299051921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,128,balanced,0.3826346794764201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,128,balanced,0.45602134863535565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,128,balanced,0.6446079810460409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,128,balanced,0.7949653466542562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,128,balanced,1.1482453346252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,1,balanced,117.35601806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,128,balanced,1.508522669474284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,4,power_law_1.01,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,4,power_law_1.01,0.46918401718139646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,4,power_law_1.01,0.715776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,4,power_law_1.01,0.9074687957763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,4,power_law_1.01,1.6343040466308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,2,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,2,power_law_1.01,0.19780479669570922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,2,power_law_1.01,0.27729918956756594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,2,power_law_1.01,0.39792640209198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,2,power_law_1.01,0.5289984226226807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,2,power_law_1.01,0.768614387512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,2,power_law_1.01,0.7659520149230957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,2,power_law_1.01,0.8226816177368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,2,power_law_1.01,0.8706048011779786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,2,power_law_1.01,0.8503168106079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,2,power_law_1.01,0.8638463973999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,2,power_law_1.01,0.8972288131713867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,2,power_law_1.01,0.912384033203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,2,power_law_1.01,0.8896512031555176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,2,power_law_1.01,0.936736011505127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,2,power_law_1.01,0.9623552322387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,2,power_law_1.01,0.9943039894104004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,2,power_law_1.01,1.102233600616455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,2,power_law_1.01,1.1220992088317872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,2,power_law_1.01,1.326899242401123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,2,power_law_1.01,1.4731264114379883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,2,power_law_1.01,1.9499008178710937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,2,power_law_1.01,2.0770816802978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,2,power_law_1.01,2.9745151519775392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,2,power_law_1.01,3.564134216308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,2,power_law_1.01,5.144166564941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,16,balanced,0.019626667102177937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,16,balanced,0.019968000551064808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,16,balanced,0.019626667102177937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,16,balanced,0.020303999384244282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,16,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,16,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,16,balanced,0.022175999979178112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,16,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,16,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,16,balanced,0.022357332209746044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,16,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,16,balanced,0.023365333676338196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,16,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,16,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,16,balanced,0.02916266769170761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,16,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,16,balanced,0.03190399954716364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,16,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,16,balanced,0.038373333712418876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,16,balanced,0.067071999112765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,16,balanced,0.06758399804433186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,16,balanced,0.11008000373840332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,2,power_law_1.01,6.683628845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,16,balanced,0.13414399822553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,16,balanced,0.27613866329193115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,4,power_law_1.01,2.000486373901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,16,balanced,0.3633493185043335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,32,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,32,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,32,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,32,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,32,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,32,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,32,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,32,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,32,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,32,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,32,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,32,balanced,0.03292799989382426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,32,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,32,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,32,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,32,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,32,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,32,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,32,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,32,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,32,balanced,0.06297599772612254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,32,balanced,0.1037600040435791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,32,balanced,0.105813334385554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,32,balanced,0.23841599623362222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,32,balanced,0.2955946723620097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,32,balanced,0.4602880080540975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,32,balanced,0.5841919978459676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,2,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,2,balanced,0.0890880028406779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,2,balanced,0.30856533845265705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,2,balanced,0.5763413508733114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,2,balanced,1.102336009343465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,2,balanced,1.371989409128825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,2,balanced,1.3808639844258626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,2,balanced,1.385642687479655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,2,balanced,1.3933226267496746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,2,balanced,1.3991252581278484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,2,balanced,1.412266731262207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,2,balanced,1.4243839581807454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,2,balanced,1.435306708017985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,2,balanced,1.4549333254496257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,2,balanced,1.4791679382324219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,2,balanced,1.497429370880127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,2,balanced,1.5400959650675456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,2,balanced,1.6230400403340657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,2,balanced,1.7003520329793294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,2,balanced,1.881600062052409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,2,balanced,2.032128016153971
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,2,balanced,2.372437318166097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,2,balanced,2.7195733388264975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,2,balanced,3.4658985137939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,2,balanced,4.3064320882161455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,2,balanced,6.158506393432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,2,balanced,8.176981608072916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.5916672229766846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,1,power_law_1.01,1.0493951797485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,1,power_law_1.01,2.0367359161376952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,1,power_law_1.01,4.040089416503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,1,power_law_1.01,7.406169891357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,1,power_law_1.01,10.25945587158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,1,power_law_1.01,11.860787200927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,1,power_law_1.01,16.077005004882814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,1,power_law_1.01,16.268902587890626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,1,power_law_1.01,16.879615783691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,1,power_law_1.01,17.66871032714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,1,power_law_1.01,18.32263641357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,1,power_law_1.01,18.9517822265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,1,power_law_1.01,19.566181945800782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,1,power_law_1.01,19.482623291015624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,8,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,8,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,8,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,8,balanced,0.02932800104220708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,8,balanced,0.030192000170548756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,8,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,8,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,8,balanced,0.03225066761175791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,8,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,8,balanced,0.03378133227427801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,8,balanced,0.037178667883078255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,8,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,8,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,8,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,8,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,8,balanced,0.06502399841944377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,8,balanced,0.07987200220425923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,8,balanced,0.20718934138615927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,1,power_law_1.01,20.802764892578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,8,balanced,0.274944007396698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,8,balanced,0.40226133664449054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,8,balanced,0.579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,8,balanced,0.9838773409525553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,8,balanced,1.3747199376424153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,1,power_law_1.01,21.723545837402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,1,power_law_1.01,23.261798095703124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,1,power_law_1.01,23.329177856445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,1,power_law_1.01,24.923135375976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,1,power_law_1.01,26.7335693359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,2,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,2,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,2,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,2,power_law_1.01,0.1622015953063965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,2,power_law_1.01,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,2,power_law_1.01,0.28876800537109376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,2,power_law_1.01,0.4112383842468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,2,power_law_1.01,0.4282368183135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,2,power_law_1.01,0.4472832202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,2,power_law_1.01,0.4632575988769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,2,power_law_1.01,0.49397759437561034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,2,power_law_1.01,0.481279993057251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,2,power_law_1.01,0.520192003250122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,1,power_law_1.01,28.938430786132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,2,power_law_1.01,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,2,power_law_1.01,0.5644288063049316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,2,power_law_1.01,0.5793791770935058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,2,power_law_1.01,0.6391808032989502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,2,power_law_1.01,0.7192512035369873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,2,power_law_1.01,0.8380415916442872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,2,power_law_1.01,1.0510335922241212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,8,power_law_1.01,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,8,power_law_1.01,0.35082240104675294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,2,power_law_1.01,1.1876352310180665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,8,power_law_1.01,0.2869247913360596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,8,power_law_1.01,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,2,power_law_1.01,1.6625663757324218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,8,power_law_1.01,0.3852288007736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,8,power_law_1.01,0.44851198196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,2,power_law_1.01,2.0801536560058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,2,power_law_1.01,2.8813312530517576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,8,power_law_1.01,0.4491263866424561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,8,power_law_1.01,0.4671487808227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,8,power_law_1.01,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,8,power_law_1.01,0.46387200355529784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,1,power_law_1.01,30.9376953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,2,power_law_1.01,3.6098049163818358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,8,power_law_1.01,0.4603903770446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,8,power_law_1.01,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,8,power_law_1.01,0.46898560523986815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,8,power_law_1.01,0.4831232070922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,8,power_law_1.01,0.47964158058166506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,8,power_law_1.01,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,2,power_law_1.01,5.427609634399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,8,power_law_1.01,0.4843264102935791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,8,power_law_1.01,0.5066624164581299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,8,power_law_1.01,0.5400576114654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,8,power_law_1.01,0.6240255832672119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,8,power_law_1.01,0.6975488185882568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,8,power_law_1.01,0.8460288047790527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,2,power_law_1.01,7.332864379882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,8,power_law_1.01,1.0393600463867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,8,power_law_1.01,1.449350357055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,8,power_law_1.01,1.6465919494628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,8,power_law_1.01,2.0762624740600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,8,power_law_1.01,2.7793407440185547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,1,power_law_1.01,37.04954833984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,1,power_law_1.01,42.03376770019531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,1,power_law_1.01,54.56404418945313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,16,power_law_1.2,0.19144959449768068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,16,power_law_1.2,0.34447360038757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,16,power_law_1.2,0.33771519660949706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,16,power_law_1.2,0.35408639907836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,16,power_law_1.2,0.3516416072845459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,16,power_law_1.2,0.265011191368103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,16,power_law_1.2,0.3053567886352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,16,power_law_1.2,0.2762495994567871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,16,power_law_1.2,0.33564159870147703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,16,power_law_1.2,0.32522239685058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,16,power_law_1.2,0.3512063980102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,16,power_law_1.2,0.3280895948410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,16,power_law_1.2,0.34549760818481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,16,power_law_1.2,0.3358720064163208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,16,power_law_1.2,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,16,power_law_1.2,0.3477504014968872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,16,power_law_1.2,0.35676159858703616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,16,power_law_1.2,0.3969023942947388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,16,power_law_1.2,0.4065279960632324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,16,power_law_1.2,0.4704256057739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,1,power_law_1.01,53.2580322265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,16,power_law_1.2,0.5263360023498536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,16,power_law_1.2,0.6498239994049072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,16,power_law_1.2,0.815494441986084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,16,power_law_1.2,1.0887167930603028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,16,power_law_1.2,1.2677120208740233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,16,power_law_1.2,1.9253248214721679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,16,power_law_1.2,2.4922111511230467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,32,power_law_1.2,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,32,power_law_1.2,0.02088959962129593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,32,power_law_1.2,0.02088959962129593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,32,power_law_1.2,0.02129279971122742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,32,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,32,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,32,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,32,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,32,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,32,power_law_1.2,0.027641600370407103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,32,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,32,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,32,power_law_1.2,0.039724799990653994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,16,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,32,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,32,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,16,power_law_1.2,0.1632256031036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,32,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,16,power_law_1.2,0.09071360230445862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,32,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,32,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,16,power_law_1.2,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,32,power_law_1.2,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,16,power_law_1.2,0.19537919759750366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,32,power_law_1.2,0.11796480417251587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,32,power_law_1.2,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,16,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,16,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,16,power_law_1.2,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,16,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,16,power_law_1.2,0.0997376024723053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,16,power_law_1.2,0.13598719835281373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,16,power_law_1.2,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,16,power_law_1.2,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,16,power_law_1.2,0.1679360032081604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,16,power_law_1.2,0.1755136013031006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,16,power_law_1.2,0.19742720127105712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,16,power_law_1.2,0.20787200927734376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,16,power_law_1.2,0.22220799922943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,16,power_law_1.2,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,16,power_law_1.2,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,16,power_law_1.2,0.3186624050140381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,16,power_law_1.2,0.38686718940734866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,16,power_law_1.2,0.44892158508300783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,16,power_law_1.2,0.638976001739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,16,power_law_1.2,0.9639936447143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,16,power_law_1.2,1.3291520118713378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,32,power_law_1.2,0.15749119520187377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,16,power_law_1.2,1.7979391098022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,32,power_law_1.2,0.369049596786499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,32,power_law_1.2,0.4118527889251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,32,power_law_1.2,0.5910528182983399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,128,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,128,balanced,0.04385066529115041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,128,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,128,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,128,balanced,0.036320000886917114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,128,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,128,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,128,balanced,0.03872533390919367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,128,balanced,0.03889599939187368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,128,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,128,balanced,0.03923733284076055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,128,balanced,0.04043733328580856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,128,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,128,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,128,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,128,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,128,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,128,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,128,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,128,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,128,balanced,0.07934933404127757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,128,balanced,0.10052266716957092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,128,balanced,0.1295360028743744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,128,balanced,0.2728959918022156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,128,balanced,0.3457706769307454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,128,balanced,0.5159253279368082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,128,balanced,0.6918826897939047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,32,power_law_1.2,1.01396484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,4,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,4,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,4,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,4,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,4,power_law_1.01,0.03275519907474518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,4,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,4,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,4,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,4,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,4,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,4,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,4,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,4,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,4,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,4,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,4,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,4,power_law_1.01,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,4,power_law_1.01,0.09152640104293823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,4,power_law_1.01,0.1912832021713257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,4,power_law_1.01,0.2549760103225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,4,power_law_1.01,0.3565567970275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,4,power_law_1.01,0.5013504028320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,4,power_law_1.01,0.8517631530761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,4,power_law_1.01,1.0803199768066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,4,power_law_1.01,1.966489601135254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,1,power_law_1.01,0.4063231945037842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,1,power_law_1.01,0.7507967948913574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,4,power_law_1.01,2.7197439193725588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,1,power_law_1.01,1.42293119430542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,1,power_law_1.01,2.494054412841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,1,power_law_1.01,3.620044708251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,1,power_law_1.01,6.042828750610352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,1,power_law_1.01,6.418841552734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,1,power_law_1.01,6.628761291503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,1,power_law_1.01,6.782566070556641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,1,power_law_1.01,6.917324829101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,1,power_law_1.01,7.250739288330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,1,power_law_1.01,7.413555145263672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,1,power_law_1.01,7.488921356201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,1,power_law_1.01,7.712153625488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,1,power_law_1.01,7.968972778320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,1,power_law_1.01,8.099635314941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,1,power_law_1.01,8.330854034423828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,1,power_law_1.01,8.788582611083985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,1,power_law_1.01,9.311846160888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,1,power_law_1.01,10.139647674560546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,32,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,32,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,32,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,32,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,32,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,32,balanced,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,32,balanced,0.30003199974695843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,32,balanced,0.30139732360839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,32,balanced,0.3036160071690877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,32,balanced,0.30481066306432086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,32,balanced,0.30190932750701904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,32,balanced,0.30429865916570026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,32,balanced,0.30771199862162274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,32,balanced,0.31249066193898517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,32,balanced,0.3198293248812358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,32,balanced,0.32477867603302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,32,balanced,0.3351893424987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,32,balanced,0.35839998722076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,32,balanced,0.3920106490453084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,32,balanced,0.4380906820297241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,1,power_law_1.01,10.826751708984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,32,balanced,0.47650134563446045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,32,balanced,0.5406719843546549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,32,balanced,0.6145706574122111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,32,balanced,0.8272213141123453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,32,balanced,1.0364586512247722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,32,balanced,1.46943998336792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,32,balanced,1.8990079561869304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,1,power_law_1.01,12.93516845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,1,power_law_1.01,14.073855590820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,1,power_law_1.01,17.848287963867186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,1,power_law_1.01,20.792697143554687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,1,power_law_1.01,28.277145385742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,1,power_law_1.01,36.17054748535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,2,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,2,balanced,0.21009065707524618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,2,balanced,0.3927040100097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,2,balanced,0.7517600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,2,balanced,1.413610617319743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,2,balanced,2.041173299153646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,2,balanced,2.0519253412882485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,2,balanced,2.063530604044596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,2,balanced,2.073088010152181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,2,balanced,2.0860586166381836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,2,balanced,2.1061760584513345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,2,balanced,2.125114599863688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,2,balanced,2.1428906122843423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,2,balanced,2.179413318634033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,2,balanced,2.216266632080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,2,balanced,2.247327963511149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,2,balanced,2.3145813941955566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,2,balanced,2.447872002919515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,2,balanced,2.580138683319092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,2,balanced,2.8779519399007163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,2,balanced,3.142810821533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,2,balanced,3.6995414098103843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,2,balanced,4.249600092569987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,2,balanced,5.334527969360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,2,balanced,6.5762983957926435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,2,balanced,9.2315305074056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,2,balanced,12.242261250813803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,32,power_law_1.01,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,32,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,32,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,32,power_law_1.01,0.052799999713897705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,32,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,32,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,32,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,32,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,32,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,32,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,32,power_law_1.01,0.05794559717178345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,32,power_law_1.01,0.06447359919548035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,32,power_law_1.01,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,32,power_law_1.01,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,32,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,32,power_law_1.01,0.14581120014190674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,32,power_law_1.01,0.13373440504074097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,32,power_law_1.01,0.21974399089813232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,32,power_law_1.01,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,32,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,32,power_law_1.01,0.34283521175384524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,32,power_law_1.01,0.44748802185058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,32,power_law_1.01,0.5863423824310303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,32,power_law_1.01,0.8419136047363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,32,power_law_1.01,1.1808768272399903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,32,power_law_1.01,1.9533824920654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,32,power_law_1.01,2.3418880462646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,2,balanced,0.311296006043752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,2,balanced,0.5290666818618774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,2,balanced,1.0373120307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,2,balanced,2.0706987380981445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,2,balanced,4.079445203145345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,2,balanced,7.951018651326497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,2,balanced,7.9639892578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,2,balanced,8.028330485026041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,2,balanced,8.039253234863281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,2,balanced,8.052223841349283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,2,balanced,8.029183705647787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,2,balanced,8.057173411051432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,2,balanced,8.08294423421224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,2,balanced,8.112639745076498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,2,balanced,8.159231821695963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,2,balanced,8.202410380045572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,2,balanced,8.31112543741862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,2,balanced,8.69324811299642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,2,balanced,8.893952051798502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,2,balanced,9.163775761922201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,2,balanced,10.068480173746744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,2,balanced,12.519765218098959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,16,power_law_1.01,0.1937280058860779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,16,power_law_1.01,0.2510848045349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,16,power_law_1.01,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,16,power_law_1.01,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,16,power_law_1.01,0.13946880102157594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,16,power_law_1.01,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,16,power_law_1.01,0.23695359230041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,16,power_law_1.01,0.2033600091934204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,2,balanced,11.026432037353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,16,power_law_1.01,0.2289664030075073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,16,power_law_1.01,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,16,power_law_1.01,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,16,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,16,power_law_1.01,0.2506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,16,power_law_1.01,0.25169920921325684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,16,power_law_1.01,0.2676480054855347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,16,power_law_1.01,0.26169600486755373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,16,power_law_1.01,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,2,balanced,11.492863972981771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,16,power_law_1.01,0.27031679153442384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,16,power_law_1.01,0.29982719421386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,16,power_law_1.01,0.30310399532318116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,16,power_law_1.01,0.3762176036834717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,16,power_law_1.01,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,16,power_law_1.01,0.5132287979125977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,16,power_law_1.01,0.6955008029937744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,16,power_law_1.01,1.0168319702148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,2,balanced,13.875882466634115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,16,power_law_1.01,1.4325759887695313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,16,power_law_1.01,1.7270784378051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,2,balanced,15.789226531982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,2,balanced,19.436203002929688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,8,balanced,0.06894933183987935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,8,balanced,0.2855253418286641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,8,balanced,0.5376000006993612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,8,balanced,1.053866704305013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,8,balanced,2.032810688018799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,8,balanced,4.0122025807698565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,8,balanced,6.006783803304036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,8,balanced,6.0031998952229815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,8,balanced,6.005077362060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,8,balanced,6.01258659362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,128,balanced,0.044010668992996216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,128,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,128,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,128,balanced,0.03804266701141993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,128,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,128,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,128,balanced,0.04043733328580856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,128,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,128,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,128,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,128,balanced,0.04195199906826019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,128,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,128,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,128,balanced,0.04453866680463155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,8,balanced,6.0170237223307295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,128,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,128,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,128,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,128,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,128,balanced,0.060218666990598045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,128,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,128,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,128,balanced,0.12627733747164407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,128,balanced,0.11912533640861511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,8,balanced,6.02998415629069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,128,balanced,0.2111039956410726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,128,balanced,0.27852799495061237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,128,balanced,0.4118186632792155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,8,balanced,6.041088104248047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,128,balanced,0.49595733483632404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,8,balanced,6.058666865030925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,8,balanced,6.079317092895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,8,balanced,6.088191986083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,8,balanced,6.121130625406901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,8,balanced,6.199296315511067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,8,balanced,6.419455846150716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,8,balanced,6.5655466715494795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,8,balanced,6.707706451416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,8,balanced,6.920517603556315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,8,balanced,7.956480026245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,8,balanced,8.354986826578775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,8,balanced,8.8896853129069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,8,balanced,10.381807963053385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,8,balanced,10.71240488688151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,4,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,4,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,4,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,4,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,4,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,4,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,4,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,4,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,4,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,4,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,4,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,4,balanced,0.027813332776228588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,4,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,4,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,4,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,4,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,4,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,4,balanced,0.049141332507133484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,4,balanced,0.06997333467006683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,4,balanced,0.07679999868075053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,4,balanced,0.11639466881752014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,4,balanced,0.2326186696688334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,4,balanced,0.35259731610616046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,4,balanced,0.4642133315404256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,4,balanced,0.7321600119272867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,4,balanced,1.0134186744689941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,1,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,1,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,1,balanced,0.08516266942024231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,1,balanced,0.3068586587905884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,1,balanced,0.5705333153406779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,1,balanced,0.710314671198527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,1,balanced,0.7195306619008383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,1,balanced,0.7263573010762533
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,1,balanced,0.7348906993865967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,1,balanced,0.7425706386566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,1,balanced,0.7575893402099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,1,balanced,0.773973306020101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,1,balanced,0.7871146996816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,1,balanced,0.8171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,1,balanced,0.8487199942270914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,1,balanced,0.8797866503397623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,1,balanced,0.9362773100535074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,1,balanced,1.0680320262908936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,1,balanced,1.2054133415222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,1,balanced,1.5810559590657551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,1,balanced,1.7745919227600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,1,balanced,2.346325397491455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,1,balanced,2.9223200480143228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,1,balanced,4.0697065989176435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,1,balanced,5.347487767537435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,1,balanced,7.925418853759766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,1,balanced,10.432682673136393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,32,power_law_1.2,0.3158015966415405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,32,power_law_1.2,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,32,power_law_1.2,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,32,power_law_1.2,0.2770944118499756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,32,power_law_1.2,0.22753279209136962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,32,power_law_1.2,0.16936960220336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,32,power_law_1.2,0.2461695909500122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,32,power_law_1.2,0.24309759140014647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,32,power_law_1.2,0.25661439895629884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,32,power_law_1.2,0.24227840900421144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,32,power_law_1.2,0.26808319091796873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,32,power_law_1.2,0.28487679958343504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,32,power_law_1.2,0.2795520067214966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,32,power_law_1.2,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,32,power_law_1.2,0.2885632038116455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,32,power_law_1.2,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,32,power_law_1.2,0.3086335897445679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,32,power_law_1.2,0.34283521175384524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,32,power_law_1.2,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,32,power_law_1.2,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,32,power_law_1.2,0.5035967826843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,32,power_law_1.2,0.7170048236846924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,32,power_law_1.2,0.8980480194091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,32,power_law_1.2,1.3877247810363769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,32,power_law_1.2,1.8216960906982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,32,power_law_1.2,2.8262399673461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,32,power_law_1.2,3.8637313842773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,32,power_law_1.01,0.7243775844573974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,32,power_law_1.01,0.7241471767425537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,32,power_law_1.01,0.7260159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,32,power_law_1.01,0.6711296081542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,32,power_law_1.01,0.6469632148742676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,32,power_law_1.01,0.6758399963378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,32,power_law_1.01,0.7051263809204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,32,power_law_1.01,0.6803455829620362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,32,power_law_1.01,0.708403205871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,32,power_law_1.01,0.7087744235992431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,32,power_law_1.01,0.7194623947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,32,power_law_1.01,0.7235583782196044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,32,power_law_1.01,0.7626751899719239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,32,power_law_1.01,0.7475200176239014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,32,power_law_1.01,0.8636159896850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,32,power_law_1.01,0.8716287612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,32,power_law_1.01,0.7997439861297607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,32,power_law_1.01,1.0334207534790039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,32,power_law_1.01,0.9293824195861816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,32,power_law_1.01,1.1405311584472657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,32,power_law_1.01,1.6295936584472657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,32,power_law_1.01,2.1581823348999025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,32,power_law_1.01,2.144870376586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,32,power_law_1.01,2.8700672149658204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,32,power_law_1.01,4.459110260009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,32,power_law_1.01,5.988966369628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,32,power_law_1.01,8.108812713623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,8,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,8,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,8,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,8,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,8,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,8,power_law_1.2,0.1286080002784729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,8,power_law_1.2,0.1478656053543091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,8,power_law_1.2,0.10219520330429077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,8,power_law_1.2,0.06552960276603699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,8,power_law_1.2,0.10301439762115479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,8,power_law_1.2,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,8,power_law_1.2,0.09969919919967651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,8,power_law_1.2,0.107315194606781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,8,power_law_1.2,0.15400960445404052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,8,power_law_1.2,0.1667072057723999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,8,power_law_1.2,0.18431999683380126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,8,power_law_1.2,0.19148800373077393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,8,power_law_1.2,0.20480000972747803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,8,power_law_1.2,0.21543679237365723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,8,power_law_1.2,0.24391679763793944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,8,power_law_1.2,0.26908159255981445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,8,power_law_1.2,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,8,power_law_1.2,0.45217280387878417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,8,power_law_1.2,0.705728006362915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,8,power_law_1.2,0.9805631637573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,8,power_law_1.2,1.6977920532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,8,power_law_1.2,1.8720767974853516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,128,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,128,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,128,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,128,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,128,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,128,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,128,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,128,power_law_1.2,0.030713599920272828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,128,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,128,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,128,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,128,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,128,power_law_1.2,0.035411199927330016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,128,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,128,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,128,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,128,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,128,power_law_1.2,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,128,power_law_1.2,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,128,power_law_1.2,0.16998399496078492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,128,power_law_1.2,0.2664448022842407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,128,power_law_1.2,0.4579328060150146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,128,power_law_1.2,0.5332992076873779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,128,power_law_1.2,0.8038399696350098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,128,power_law_1.2,1.1814911842346192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,128,power_law_1.2,1.859379196166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,64,power_law_1.2,0.036236798763275145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,64,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,64,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,64,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,64,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,64,power_law_1.2,0.02597759962081909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,64,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,64,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,64,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,64,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,64,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,64,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,64,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,64,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,64,power_law_1.2,0.04747520089149475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,64,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,64,power_law_1.2,0.11878399848937989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,64,power_law_1.2,0.11796480417251587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,64,power_law_1.2,0.15749119520187377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,64,power_law_1.2,0.31395840644836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,64,power_law_1.2,0.3817471981048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,64,power_law_1.2,0.6766592025756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,64,power_law_1.2,0.9443327903747558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,128,power_law_1.01,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,128,power_law_1.01,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,128,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,128,power_law_1.01,0.020070399343967437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,128,power_law_1.01,0.020275199413299562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,128,power_law_1.01,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,128,power_law_1.01,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,16,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,128,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,128,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,128,power_law_1.01,0.025798401236534117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,128,power_law_1.01,0.02661119997501373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,128,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,128,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,128,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,16,balanced,0.04010133445262909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,128,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,128,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,128,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,128,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,128,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,128,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,128,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,16,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,128,power_law_1.01,0.09338880181312562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,128,power_law_1.01,0.11263999938964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,128,power_law_1.01,0.1581055998802185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,128,power_law_1.01,0.23900160789489747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,128,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,16,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,16,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,16,balanced,0.04573333263397217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,16,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,128,power_law_1.01,0.5388288021087646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,16,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,16,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,16,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,16,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,16,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,16,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,16,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,16,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,16,balanced,0.06877866884072621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,16,balanced,0.07321600119272868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,16,balanced,0.09897599617640178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,16,balanced,0.1735573410987854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,16,balanced,0.2868853410085042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,16,balanced,0.40089599291483563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,16,balanced,0.5560319821039835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,16,balanced,0.7579306761423746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,16,balanced,1.148586670557658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,16,balanced,1.5837866465250652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,128,power_law_1.2,2.7052032470703127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,4,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,4,balanced,0.055125330885251365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,4,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,4,balanced,0.2764799992243449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,4,balanced,0.5338453451792399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,4,balanced,1.030997355779012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,4,balanced,1.5342933336893718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,4,balanced,1.537706693013509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,4,balanced,1.5436800320943196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,4,balanced,1.5481173197428386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,4,balanced,1.558186690012614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,4,balanced,1.569610595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,4,balanced,1.5737172762552898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,4,balanced,1.5822505950927734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,4,balanced,1.60426664352417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,4,balanced,1.6174079577128093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,4,balanced,1.6501760482788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,4,balanced,1.711957295735677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,4,balanced,1.799850622812907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,4,balanced,1.9148799578348796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,4,balanced,2.0456107457478843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,4,balanced,2.3203840255737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,4,balanced,2.5724587440490723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,4,balanced,3.171669324239095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,4,balanced,3.6730880737304688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,4,balanced,4.902741432189941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,4,balanced,6.130005518595378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.5486400127410889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,1,power_law_1.01,1.0340352058410645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,1,power_law_1.01,2.0860927581787108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,1,power_law_1.01,3.0842880249023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,1,power_law_1.01,4.104396820068359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,1,power_law_1.01,5.8718208312988285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,1,power_law_1.01,6.141132736206055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,1,power_law_1.01,6.405734252929688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,1,power_law_1.01,6.432768249511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,1,power_law_1.01,6.547046661376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,1,power_law_1.01,6.812262725830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,1,power_law_1.01,7.100211334228516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,1,power_law_1.01,7.255244445800781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,1,power_law_1.01,7.5608062744140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,1,power_law_1.01,7.748198699951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,1,power_law_1.01,8.058656311035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,1,power_law_1.01,8.690278625488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,1,power_law_1.01,8.903065490722657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,32,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,32,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,32,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,32,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,32,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,32,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,32,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,1,power_law_1.01,9.45950698852539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,32,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,32,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,32,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,32,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,32,balanced,0.0327360009153684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,32,balanced,0.03310399999221166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,32,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,32,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,32,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,32,balanced,0.04794133206208547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,32,balanced,0.054602667689323425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,32,balanced,0.07063999772071838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,32,balanced,0.16759467124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,32,balanced,0.2872320016225179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,32,balanced,0.370688001314799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,1,power_law_1.01,9.894297790527343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,32,balanced,0.6000639994939169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,32,balanced,0.808789332707723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,1,power_law_1.01,11.289804840087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,1,power_law_1.01,12.296371459960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,1,power_law_1.01,15.452755737304688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,1,power_law_1.01,17.28143310546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,1,power_law_1.01,22.83458557128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,1,power_law_1.01,28.390579223632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,4,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,4,power_law_1.01,0.28733439445495607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,4,power_law_1.01,0.5433343887329102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,4,power_law_1.01,0.5152768135070801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,4,power_law_1.01,0.7690239906311035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,4,power_law_1.01,0.9889792442321778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,4,power_law_1.01,0.9062399864196777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,4,power_law_1.01,1.3344767570495606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,4,power_law_1.01,1.3619199752807618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,4,power_law_1.01,1.1853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,4,power_law_1.01,1.2820480346679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,4,power_law_1.01,1.3094911575317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,4,power_law_1.01,1.338368034362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,4,power_law_1.01,1.3107199668884277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,4,power_law_1.01,1.3766655921936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,4,power_law_1.01,1.4174207687377929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,4,power_law_1.01,1.4598143577575684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,4,power_law_1.01,1.6052223205566407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,4,power_law_1.01,1.618534469604492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,4,power_law_1.01,1.8311168670654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,4,power_law_1.01,1.925939178466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,4,power_law_1.01,2.332467269897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,4,power_law_1.01,2.668339157104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,128,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,128,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,4,power_law_1.01,3.403776168823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,128,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,128,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,128,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,4,power_law_1.01,3.943423843383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,128,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,128,power_law_1.01,0.05406079888343811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,128,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,128,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,4,power_law_1.01,5.694054412841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,128,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,128,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,128,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,128,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,128,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,128,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,4,power_law_1.01,7.017881774902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,128,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,128,power_law_1.01,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,128,power_law_1.01,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,128,power_law_1.01,0.14315520524978637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,128,power_law_1.01,0.24145920276641847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,128,power_law_1.01,0.321126389503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,128,power_law_1.01,0.41840639114379885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,128,power_law_1.01,0.5369855880737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,128,power_law_1.01,0.8892416000366211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,128,power_law_1.01,1.1653120040893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,128,power_law_1.01,1.7965055465698243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,128,power_law_1.01,2.367897605895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,8,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,8,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,8,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,8,power_law_1.01,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,8,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,8,power_law_1.01,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,8,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,8,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,8,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,8,power_law_1.01,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,8,power_law_1.01,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,8,power_law_1.01,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,8,power_law_1.01,0.13701119422912597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,8,power_law_1.01,0.12963839769363403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,8,power_law_1.01,0.1703935980796814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,8,power_law_1.01,0.22691841125488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,8,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,8,power_law_1.01,0.3268608093261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,8,power_law_1.01,0.3848191976547241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,8,power_law_1.01,0.709222412109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,8,power_law_1.01,0.9099264144897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,8,power_law_1.01,1.2007424354553222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,8,power_law_1.01,1.6513023376464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,8,power_law_1.01,2.5610240936279296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,8,power_law_1.01,3.4469886779785157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,8,power_law_1.01,5.076582336425782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,8,power_law_1.01,5.679103851318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,32,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,32,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,32,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,32,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,32,power_law_1.01,0.03088639974594116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,32,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,32,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,32,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,32,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,32,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,32,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,32,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,32,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,32,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,32,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,32,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,32,power_law_1.01,0.0710591971874237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,32,power_law_1.01,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,32,power_law_1.01,0.1253376007080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,32,power_law_1.01,0.15664000511169435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,32,power_law_1.01,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,32,power_law_1.01,0.33136639595031736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,32,power_law_1.01,0.5984255790710449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,32,power_law_1.01,0.6133759975433349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,32,power_law_1.01,1.0655743598937988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,32,power_law_1.01,1.7528831481933593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,16,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,16,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,16,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,16,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,16,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,16,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,16,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,16,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,16,power_law_1.01,0.03644160032272339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,16,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,16,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,16,power_law_1.01,0.04689280092716217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,16,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,16,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,16,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,16,power_law_1.01,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,16,power_law_1.01,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,16,power_law_1.01,0.15196160078048707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,16,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,16,power_law_1.01,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,16,power_law_1.01,0.36884479522705077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,16,power_law_1.01,0.46284799575805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,16,power_law_1.01,0.7421951770782471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,16,power_law_1.01,1.0465279579162599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,16,power_law_1.01,1.7920000076293945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,16,power_law_1.01,2.1786624908447267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,8,power_law_1.01,0.21831679344177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,8,power_law_1.01,0.393830394744873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,8,power_law_1.01,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,8,power_law_1.01,0.3907583951950073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,8,power_law_1.01,0.49930238723754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,8,power_law_1.01,0.5150720119476319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,8,power_law_1.01,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,8,power_law_1.01,0.47656960487365724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,8,power_law_1.01,0.4958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,8,power_law_1.01,0.4990719795227051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,8,power_law_1.01,0.49315838813781737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,8,power_law_1.01,0.5177343845367431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,8,power_law_1.01,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,8,power_law_1.01,0.5509119987487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,8,power_law_1.01,0.5500927925109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,8,power_law_1.01,0.5720064163208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,8,power_law_1.01,0.6080512046813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,8,power_law_1.01,0.6459392070770263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,8,power_law_1.01,0.7155712127685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,8,power_law_1.01,0.8095744132995606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,8,power_law_1.01,0.9721856117248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,8,power_law_1.01,1.1988991737365722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,8,power_law_1.01,1.4106623649597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,8,power_law_1.01,1.8946048736572265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,8,power_law_1.01,2.5403392791748045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,8,power_law_1.01,3.5133438110351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,8,power_law_1.01,4.8037761688232425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,64,power_law_1.2,0.46346240043640136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,64,power_law_1.2,0.41635842323303224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,64,power_law_1.2,0.41656317710876467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,64,power_law_1.2,0.4136960029602051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,64,power_law_1.2,0.3768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,64,power_law_1.2,0.39444479942321775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,64,power_law_1.2,0.3147775888442993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,64,power_law_1.2,0.42086400985717776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,64,power_law_1.2,0.3960832118988037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,64,power_law_1.2,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,64,power_law_1.2,0.40181760787963866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,64,power_law_1.2,0.39137279987335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,64,power_law_1.2,0.4069375991821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,64,power_law_1.2,0.40508160591125486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,64,power_law_1.2,0.38010880947113035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,64,power_law_1.2,0.4079616069793701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,64,power_law_1.2,0.4603903770446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,64,power_law_1.2,0.4433919906616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,64,power_law_1.2,0.5179391860961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,64,power_law_1.2,0.5326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,64,power_law_1.2,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,64,power_law_1.2,0.9820159912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,64,power_law_1.2,1.0297344207763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,64,power_law_1.2,1.448140811920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,64,power_law_1.2,2.229452705383301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,64,power_law_1.2,3.2974849700927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,64,power_law_1.2,3.9438335418701174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,32,power_law_1.2,1.0733440399169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,32,power_law_1.2,1.0706944465637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,32,power_law_1.2,1.064140796661377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,32,power_law_1.2,1.0702848434448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,32,power_law_1.2,0.9904128074645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,32,power_law_1.2,0.9967616081237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,32,power_law_1.2,0.9791487693786621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,32,power_law_1.2,0.9383935928344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,32,power_law_1.2,0.9418751716613769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,32,power_law_1.2,0.9545727729797363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,32,power_law_1.2,0.9869312286376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,32,power_law_1.2,0.9998335838317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,32,power_law_1.2,1.0172224044799805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,32,power_law_1.2,1.0502143859863282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,32,power_law_1.2,1.0653696060180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,32,power_law_1.2,1.1157504081726075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,32,power_law_1.2,1.1401151657104491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,32,power_law_1.2,1.2273664474487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,32,power_law_1.2,1.2611583709716796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,32,power_law_1.2,1.7334272384643554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,32,power_law_1.2,1.823744010925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,32,power_law_1.2,2.614886474609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,32,power_law_1.2,2.710323143005371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,32,power_law_1.2,3.6743167877197265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,32,power_law_1.2,5.054668807983399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,32,power_law_1.2,6.533529663085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,32,power_law_1.2,7.642111968994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,1,power_law_1.01,0.527564811706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,1,power_law_1.01,0.8839167594909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,1,power_law_1.01,1.075814437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,1,power_law_1.01,2.0604736328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,1,power_law_1.01,2.015212821960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,1,power_law_1.01,2.0002815246582033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,1,power_law_1.01,2.0566015243530273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,1,power_law_1.01,2.0758527755737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,1,power_law_1.01,2.085887908935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,1,power_law_1.01,2.16760311126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,1,power_law_1.01,2.307891273498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,1,power_law_1.01,2.404966354370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,1,power_law_1.01,2.450841522216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,1,power_law_1.01,2.490777587890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,1,power_law_1.01,2.6294271469116213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,1,power_law_1.01,2.816204833984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,1,power_law_1.01,3.1066112518310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,1,power_law_1.01,3.771596908569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,1,power_law_1.01,4.117094421386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.1662976026535034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.25231359004974363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,1,power_law_1.01,5.119379043579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.4073472023010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.43765759468078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.4433919906616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.46305279731750487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.47902722358703614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.48435201644897463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.4976640224456787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,1,power_law_1.01,5.822054290771485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.5287936210632325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.5492735862731933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.5541696071624755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.6062079906463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.7081984043121338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.8142848014831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,1,power_law_1.01,1.0672127723693847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,1,power_law_1.01,1.2933119773864745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,1,power_law_1.01,1.7780736923217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,1,power_law_1.01,2.2585344314575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,1,power_law_1.01,3.319193649291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,1,power_law_1.01,4.356915283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,1,power_law_1.01,6.5185791015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,1,power_law_1.01,8.67675552368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,1,power_law_1.01,7.666073608398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,1,power_law_1.01,9.64874267578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,1,power_law_1.01,13.491813659667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,4,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,4,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,4,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,4,balanced,0.02712533374627431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,4,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,4,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,4,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,4,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,4,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,4,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,4,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,4,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,4,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,4,balanced,0.031727999448776245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,4,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,4,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,4,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,4,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,4,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,4,balanced,0.0911253293355306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,4,balanced,0.10443733135859172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,4,balanced,0.1858560045560201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,4,balanced,0.2882560094197591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,4,balanced,0.4196693499883016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,4,balanced,0.5681493282318115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,4,balanced,0.8944640159606934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,4,balanced,1.2209493319193523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,1,power_law_1.01,18.560000610351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,8,power_law_1.2,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,8,power_law_1.2,0.04423039853572845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,8,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,8,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,8,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,8,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,8,power_law_1.2,0.07475200295448303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,8,power_law_1.2,0.07596799731254578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,8,power_law_1.2,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,8,power_law_1.2,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,8,power_law_1.2,0.12840960025787354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,8,power_law_1.2,0.1435647964477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,8,power_law_1.2,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,8,power_law_1.2,0.22669439315795897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,8,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,8,power_law_1.2,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,8,power_law_1.2,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,8,power_law_1.2,0.790118408203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,8,power_law_1.2,1.0569727897644043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,8,power_law_1.2,1.656012725830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,1,power_law_1.01,26.57750549316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,8,power_law_1.2,2.190719985961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,8,power_law_1.2,3.0496768951416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,1,power_law_1.01,34.241946411132815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,8,power_law_1.2,4.324140930175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,8,power_law_1.2,5.54332160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,8,power_law_1.01,0.03274880051612854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,8,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,8,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,8,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,8,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,8,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,8,power_law_1.01,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,8,power_law_1.01,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,8,power_law_1.01,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,8,power_law_1.01,0.10629119873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,8,power_law_1.01,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,8,power_law_1.01,0.16179200410842895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,8,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,8,power_law_1.01,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,8,power_law_1.01,0.49745922088623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,8,power_law_1.01,0.677888011932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,8,power_law_1.01,0.9797632217407226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,8,power_law_1.2,7.818854522705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,8,power_law_1.01,1.66297607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,8,power_law_1.01,2.085478401184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,4,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,4,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,4,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,4,balanced,0.2850133379300435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,4,balanced,0.5420373280843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,4,balanced,0.5464640061060587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,4,balanced,0.5505706469217936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,4,balanced,0.5536426703135172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,4,balanced,0.5555200179417928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,4,balanced,0.5550080140431722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,4,balanced,0.5635413328806559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,4,balanced,0.570026675860087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,4,balanced,0.575488011042277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,4,balanced,0.5881173213322958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,4,balanced,0.6000639994939169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,4,balanced,0.6290773153305054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,4,balanced,0.6790826320648193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,4,balanced,0.7246507008870443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,4,balanced,0.8113493124643961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,4,balanced,0.9074347019195557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,4,balanced,1.1422719955444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,4,balanced,1.3815466562906902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,4,balanced,1.9083946545918782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,4,balanced,2.486442724863688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,4,balanced,3.552768071492513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,4,balanced,4.653738657633464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,8,power_law_1.01,3.2346111297607423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,8,power_law_1.01,4.389888000488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,2,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,2,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,2,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,2,power_law_1.2,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,2,power_law_1.2,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,2,power_law_1.2,0.11980799436569214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,2,power_law_1.2,0.214630389213562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,2,power_law_1.2,0.23203840255737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,2,power_law_1.2,0.2500607967376709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,2,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,2,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,2,power_law_1.2,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,2,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,2,power_law_1.2,0.3158015966415405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,2,power_law_1.2,0.3231744050979614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,2,power_law_1.2,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,2,power_law_1.2,0.3794944047927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,2,power_law_1.2,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,2,power_law_1.2,0.528166389465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,2,power_law_1.2,0.7557119846343994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,2,power_law_1.2,0.9414655685424804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,2,power_law_1.2,1.3064191818237305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,2,power_law_1.2,1.8249727249145509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,2,power_law_1.2,2.6171392440795898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,2,power_law_1.2,3.6382720947265623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,2,power_law_1.2,5.6573951721191404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,2,power_law_1.2,7.016652679443359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,2,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,2,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,2,power_law_1.01,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,2,power_law_1.01,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,2,power_law_1.01,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,2,power_law_1.01,0.39976959228515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,2,power_law_1.01,0.4014080047607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,2,power_law_1.01,0.4118527889251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,2,power_law_1.01,0.42270717620849607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,2,power_law_1.01,0.43294720649719237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,2,power_law_1.01,0.42741761207580564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,2,power_law_1.01,0.4554751873016357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,2,power_law_1.01,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,2,power_law_1.01,0.47450881004333495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,2,power_law_1.01,0.48906240463256834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,2,power_law_1.01,0.4868095874786377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,2,power_law_1.01,0.47411198616027833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,2,power_law_1.01,0.5099520206451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,2,power_law_1.01,0.5459968090057373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,2,power_law_1.01,0.633843183517456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,2,power_law_1.01,0.6610943794250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,2,power_law_1.01,0.8732671737670898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,2,power_law_1.01,1.0295295715332031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,2,power_law_1.01,1.4053376197814942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,2,power_law_1.01,1.7528831481933593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,2,power_law_1.01,2.577408027648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,2,power_law_1.01,3.362406539916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,1,power_law_1.2,0.7485119819641113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,1,power_law_1.2,1.419264030456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,1,power_law_1.2,2.792448043823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,1,power_law_1.2,4.4179328918457035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,1,power_law_1.2,6.2531585693359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,1,power_law_1.2,11.76965103149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,1,power_law_1.2,12.670950317382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,1,power_law_1.2,13.249331665039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,1,power_law_1.2,13.697407531738282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,1,power_law_1.2,13.984768676757813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,1,power_law_1.2,14.318797302246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,1,power_law_1.2,14.746829223632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,1,power_law_1.2,15.273779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,1,power_law_1.2,15.942451477050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,1,power_law_1.2,16.148684692382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,1,power_law_1.2,16.298188781738283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,1,power_law_1.2,16.693247985839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,1,power_law_1.2,17.5278076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,1,power_law_1.2,17.882521057128905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,1,power_law_1.2,19.128115844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,1,power_law_1.2,20.92974090576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,128,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,128,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,128,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,128,power_law_1.2,0.0239424005150795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,128,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,128,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,128,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,128,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,128,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,128,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,128,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,128,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,128,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,128,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,128,power_law_1.2,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,128,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,128,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,128,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,128,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,128,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,128,power_law_1.2,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,1,power_law_1.2,24.115199279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,128,power_law_1.2,0.11263999938964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,128,power_law_1.2,0.14274560213088988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,128,power_law_1.2,0.3010560035705566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,128,power_law_1.2,0.4335616111755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,128,power_law_1.2,0.6918144226074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,1,power_law_1.2,26.653900146484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,1,power_law_1.2,33.72520446777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,1,power_law_1.2,38.72133178710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,128,power_law_1.2,0.9428799629211426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,16,power_law_1.2,0.5675007820129394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,16,power_law_1.2,1.0346495628356933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,16,power_law_1.2,1.325875186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,16,power_law_1.2,1.4735360145568848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,16,power_law_1.2,1.5200127601623534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,16,power_law_1.2,1.4993408203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,2,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,2,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,2,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,2,balanced,0.0646666685740153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,16,power_law_1.2,1.368883228302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,2,balanced,0.2855253418286641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,2,balanced,0.5358933210372925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,2,balanced,0.5408106644948324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,2,balanced,0.547978679339091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,16,power_law_1.2,1.2023807525634767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,2,balanced,0.5548373460769653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,2,balanced,0.5573973258336385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,2,balanced,0.5669546524683634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,2,balanced,0.5776906808217367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,16,power_law_1.2,1.265459156036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,2,balanced,0.5860693454742432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,2,balanced,0.6010880072911581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,2,balanced,0.6212266683578491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,2,balanced,0.6391466856002808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,16,power_law_1.2,1.1827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,2,balanced,0.6787412961324056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,2,balanced,0.7492266496022543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,2,balanced,0.8483520348866781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,16,power_law_1.2,1.2517375946044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,2,balanced,1.0047146479288738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,16,power_law_1.2,1.2816384315490723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,2,balanced,1.192618687947591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,2,balanced,1.5626239776611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,16,power_law_1.2,1.2527615547180175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,2,balanced,1.942186673482259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,16,power_law_1.2,1.263206386566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,2,balanced,2.720933278401693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,16,power_law_1.2,1.3516799926757812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,16,power_law_1.2,1.4655488014221192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,2,balanced,3.578709284464518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,16,power_law_1.2,1.4458880424499512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,1,power_law_1.2,51.086099243164064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,16,power_law_1.2,1.5333248138427735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,2,balanced,5.2718931833903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,16,power_law_1.2,1.5681535720825195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,16,power_law_1.2,1.743462371826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,2,balanced,6.990847905476888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,16,power_law_1.2,1.8817024230957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,16,power_law_1.2,2.27061767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,16,power_law_1.2,2.613043212890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,16,power_law_1.2,3.6175872802734377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,16,power_law_1.2,4.387417602539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,16,power_law_1.2,6.086860656738281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,16,power_law_1.2,6.890496063232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,1,power_law_1.2,64.25252075195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,2,balanced,0.4684799909591675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,2,balanced,0.9048746426900228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,2,balanced,1.8003627459208171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,2,balanced,1.7762986818949382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,2,balanced,1.777488072713216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,2,balanced,1.7817600568135579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,2,balanced,1.7885866165161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,2,balanced,1.798997402191162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,2,balanced,1.8493439356486003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,2,balanced,1.8582186698913574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,2,balanced,1.8742613792419434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,2,balanced,1.8916692733764648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,2,balanced,1.896447976430257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,2,balanced,1.9300692876180012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,2,balanced,2.943488121032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,2,balanced,2.9974187215169272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,2,balanced,3.069098790486654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,2,balanced,4.233557383219401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,2,balanced,5.127338727315267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,2,balanced,6.3633066813151045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,2,balanced,7.62333869934082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,2,balanced,9.16701889038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,2,balanced,10.92300796508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,2,balanced,14.112597147623697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,2,balanced,17.55733362833659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,2,balanced,23.037269592285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,2,balanced,28.601003011067707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,32,balanced,0.021333334346612293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,32,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,32,balanced,0.019968000551064808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,32,balanced,0.02065066620707512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,32,balanced,0.021477334201335907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,32,balanced,0.022175999979178112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,32,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,32,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,32,balanced,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,32,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,32,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,32,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,32,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,32,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,32,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,32,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,32,balanced,0.029861333469549816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,32,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,32,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,32,balanced,0.036506667733192444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,32,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,32,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,32,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,32,balanced,0.10103467106819153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,32,balanced,0.1104213297367096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,32,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,32,balanced,0.2943999965985616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,1,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,1,power_law_1.01,0.23838720321655274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,1,power_law_1.01,0.4472832202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,1,power_law_1.01,0.6807551860809327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,1,power_law_1.01,0.8767487525939941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,1,power_law_1.01,1.4380800247192382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,1,power_law_1.01,1.529651165008545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,1,power_law_1.01,1.5878144264221192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,1,power_law_1.01,1.5996928215026855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,1,power_law_1.01,1.663795280456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,1,power_law_1.01,1.6891904830932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,1,power_law_1.01,1.7149951934814454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,1,power_law_1.01,1.7872896194458008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,1,power_law_1.01,1.8114559173583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,1,power_law_1.01,1.8278335571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,1,power_law_1.01,1.822105598449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,1,power_law_1.01,1.9130367279052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,1,power_law_1.01,2.020966339111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,1,power_law_1.01,2.1413631439208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,1,power_law_1.01,2.387558364868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,1,power_law_1.01,2.6863616943359374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,1,power_law_1.01,3.2485374450683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,1,power_law_1.01,3.9471103668212892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,1,power_law_1.01,5.280972671508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,1,power_law_1.01,6.045491027832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,1,power_law_1.01,8.607743835449218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,1,power_law_1.01,11.250873565673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,8,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,8,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,8,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,8,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,8,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,8,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,8,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,8,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,8,power_law_1.01,0.042182400822639465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,8,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,8,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,8,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,8,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,8,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,8,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,8,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,8,power_law_1.01,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,8,power_law_1.01,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,8,power_law_1.01,0.2041599988937378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,8,power_law_1.01,0.2977792024612427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,8,power_law_1.01,0.4120448112487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,8,power_law_1.01,0.6438911914825439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,8,power_law_1.01,0.9732095718383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,8,power_law_1.01,1.3987839698791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,2,balanced,0.07577600081761678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,2,balanced,0.306005338827769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,2,balanced,0.5748053391774496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,2,balanced,1.1013120015462239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,2,balanced,2.161322593688965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,2,balanced,2.7356160481770835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,2,balanced,2.7487573623657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,2,balanced,2.708479881286621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,2,balanced,2.7175254821777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,2,balanced,2.7270825703938804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,2,balanced,2.7429545720418296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,2,balanced,2.7607040405273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,2,balanced,2.775893211364746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,2,balanced,2.8016640345255532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,2,balanced,2.8287998835245767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,2,balanced,2.8523521423339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,2,balanced,2.905429204305013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,2,balanced,3.007317225138346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,2,balanced,3.1086934407552085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,2,balanced,3.3174187342325845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,2,balanced,3.5271679560343423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,2,balanced,3.809109369913737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,2,balanced,4.221952120463054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,2,balanced,5.1249494552612305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,2,balanced,6.31278928120931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,2,balanced,9.195690790812174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,2,balanced,12.16818110148112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,1,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,1,power_law_1.2,0.0323199987411499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,1,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,1,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,1,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,1,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,1,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,1,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,1,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,1,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,1,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,1,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,1,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,1,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,1,power_law_1.2,0.08702719807624817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,1,power_law_1.2,0.1026047945022583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,1,power_law_1.2,0.15564800500869752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,1,power_law_1.2,0.214630389213562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,1,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,1,power_law_1.2,0.3229696035385132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,1,power_law_1.2,0.4206592082977295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,1,power_law_1.2,0.6254591941833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.5939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,1,power_law_1.01,1.1182080268859864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,1,power_law_1.01,2.18603515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,1,power_law_1.2,0.8556544303894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,1,power_law_1.01,3.685171127319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,1,power_law_1.01,4.966604614257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,1,power_law_1.01,8.341913604736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,1,power_law_1.01,8.802098846435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,1,power_law_1.01,9.172172546386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,1,power_law_1.01,9.568460845947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,1,power_law_1.01,9.506201934814452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,1,power_law_1.01,9.60491485595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,1,power_law_1.01,10.111795043945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,1,power_law_1.01,10.14681625366211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,1,power_law_1.01,10.763878631591798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,1,power_law_1.2,1.3676544189453126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,1,power_law_1.01,11.0487548828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,1,power_law_1.01,11.380941009521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,1,power_law_1.01,11.431526184082031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,1,power_law_1.01,12.072959899902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,1,power_law_1.01,12.538880157470704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,1,power_law_1.2,1.8737152099609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,1,power_law_1.01,13.7101318359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,1,power_law_1.01,14.59752960205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,1,power_law_1.01,17.439942932128908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,1,power_law_1.01,17.249273681640624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,1,power_law_1.01,21.681561279296876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,1,power_law_1.01,26.254949951171874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,1,power_law_1.01,34.676123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,1,power_law_1.2,2.91408634185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,1,power_law_1.01,44.033843994140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,1,power_law_1.2,3.930521774291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,8,power_law_1.2,1.4614527702331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,8,power_law_1.2,2.271846389770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,8,power_law_1.2,2.5991167068481444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,8,power_law_1.2,3.099033546447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,8,power_law_1.2,3.6759361267089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,8,power_law_1.2,3.8635520935058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,8,power_law_1.2,3.8739967346191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,8,power_law_1.2,3.649740982055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,8,power_law_1.2,3.645644760131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,8,power_law_1.2,3.747020721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,8,power_law_1.2,3.6741119384765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,8,power_law_1.2,3.792486572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,8,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,8,power_law_1.2,3.943423843383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,8,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,8,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,8,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,8,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,8,power_law_1.2,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,8,power_law_1.2,4.051968002319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,8,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,8,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,8,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,8,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,8,power_law_1.2,4.246118545532227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,8,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,8,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,8,power_law_1.2,0.05589759945869446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,8,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,8,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,8,power_law_1.2,0.08273919820785522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,8,power_law_1.2,4.22400016784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,8,power_law_1.2,0.1060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,8,power_law_1.2,0.1652735948562622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,8,power_law_1.2,0.24289278984069823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,8,power_law_1.2,0.30658559799194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,8,power_law_1.2,4.281958389282226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,8,power_law_1.2,4.3558910369873045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,8,power_law_1.2,4.732908630371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,8,power_law_1.2,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,8,power_law_1.2,5.060812759399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,8,power_law_1.2,5.721273422241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,8,power_law_1.2,7.233740997314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,8,power_law_1.2,7.036287689208985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,8,power_law_1.2,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,8,power_law_1.2,9.70813446044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,8,power_law_1.2,10.455014038085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,8,power_law_1.2,15.490663146972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,8,power_law_1.2,0.7809023857116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,8,power_law_1.2,1.3758463859558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,8,power_law_1.2,17.325465393066406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,8,power_law_1.2,1.6426944732666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,2,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,2,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,2,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,2,power_law_1.01,0.3565567970275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,2,power_law_1.01,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,2,power_law_1.01,0.5347263813018799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,2,power_law_1.01,0.816710376739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,2,power_law_1.01,0.8105983734130859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,2,power_law_1.01,0.8146944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,2,power_law_1.01,0.8970239639282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,2,power_law_1.01,0.8998911857604981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,2,power_law_1.01,0.942899227142334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,2,power_law_1.01,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,2,power_law_1.01,0.983238410949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,2,power_law_1.01,0.9885696411132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,2,power_law_1.01,1.057587242126465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,2,power_law_1.01,1.0891263961791993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,2,power_law_1.01,1.2288000106811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,2,power_law_1.01,1.299251174926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,2,power_law_1.01,1.5411199569702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,2,power_law_1.01,1.7729536056518556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,2,power_law_1.01,2.168217658996582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,2,power_law_1.01,2.5679807662963867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,2,power_law_1.01,3.4846721649169923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,2,power_law_1.01,4.463616180419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,2,power_law_1.01,6.178406524658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,2,power_law_1.01,7.871282958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,2,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,2,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,2,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,2,power_law_1.01,0.324403190612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,2,power_law_1.01,0.46346240043640136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,2,power_law_1.01,0.6176767826080323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,2,power_law_1.01,0.7565311908721923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,2,power_law_1.01,0.8079360008239747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,2,power_law_1.01,0.8273920059204102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,2,power_law_1.01,0.8888319969177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,2,power_law_1.01,0.9232383728027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,2,power_law_1.01,0.933683204650879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,2,power_law_1.01,0.983238410949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,2,power_law_1.01,1.0375167846679687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,2,power_law_1.01,1.0610688209533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,2,power_law_1.01,1.1032575607299804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,2,power_law_1.01,1.1249664306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,2,power_law_1.01,1.2668928146362304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,2,power_law_1.01,1.4012415885925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,2,power_law_1.01,1.6336896896362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,2,power_law_1.01,1.8310976028442383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,2,power_law_1.01,2.4424448013305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,2,power_law_1.01,2.812723159790039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,2,power_law_1.01,3.931545639038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,2,power_law_1.01,4.9717247009277346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,4,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,2,power_law_1.01,7.456153869628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,4,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,4,power_law_1.2,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,4,power_law_1.2,0.05610880255699158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,4,power_law_1.2,0.11427839994430541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,4,power_law_1.2,0.21441919803619386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,4,power_law_1.2,0.22446079254150392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,4,power_law_1.2,0.21790719032287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,4,power_law_1.2,0.2213887929916382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,4,power_law_1.2,0.23367679119110107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,4,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,8,power_law_1.2,0.5152768135070801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,2,power_law_1.01,9.543270111083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,4,power_law_1.2,0.2545664072036743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,8,power_law_1.2,0.4583424091339111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,4,power_law_1.2,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,8,power_law_1.2,0.46323838233947756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,4,power_law_1.2,0.26214399337768557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,8,power_law_1.2,0.46387200355529784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,8,power_law_1.2,0.46694397926330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,8,power_law_1.2,0.47124481201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,8,power_law_1.2,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,8,power_law_1.2,0.47861762046813966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,8,power_law_1.2,0.5478400230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,4,power_law_1.2,0.2617343902587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,8,power_law_1.2,0.7415808200836181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,4,power_law_1.2,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,4,power_law_1.2,0.265830397605896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,8,power_law_1.2,0.8126463890075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,4,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,8,power_law_1.2,0.9342975616455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,4,power_law_1.2,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,4,power_law_1.2,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,8,power_law_1.2,1.0170368194580077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,4,power_law_1.2,0.364134407043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,4,power_law_1.2,0.43929600715637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,8,power_law_1.2,0.953548812866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,4,power_law_1.2,0.6656000137329101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,4,power_law_1.2,0.9363391876220704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,8,power_law_1.2,1.2635775566101075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,4,power_law_1.2,1.0866687774658204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,8,power_law_1.2,1.2105728149414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,8,power_law_1.2,1.6025279998779296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,8,power_law_1.2,2.714828872680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,4,power_law_1.2,1.7438720703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,8,power_law_1.2,2.9536256790161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,8,power_law_1.2,3.7904384613037108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,4,power_law_1.2,2.525388717651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,8,power_law_1.2,5.419212722778321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,8,power_law_1.2,7.268147277832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,8,power_law_1.2,8.859238433837891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,8,power_law_1.2,12.494233703613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,1,power_law_1.01,0.5781504154205322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,1,power_law_1.01,1.0969087600708007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,1,power_law_1.01,2.1606399536132814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,1,power_law_1.01,3.3363967895507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,1,power_law_1.01,4.869734573364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,1,power_law_1.01,8.142233276367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,1,power_law_1.01,8.76337890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,1,power_law_1.01,8.858214569091796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,1,power_law_1.01,9.199616241455079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,1,power_law_1.01,9.42837142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,1,power_law_1.01,9.757901000976563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,1,power_law_1.01,9.89818878173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,1,power_law_1.01,10.091110229492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,1,power_law_1.01,10.330726623535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,8,power_law_1.2,15.267430114746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,1,power_law_1.01,10.622566223144531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,1,power_law_1.01,10.682572937011718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,1,power_law_1.01,10.994278717041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,1,power_law_1.01,11.439513397216796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,1,power_law_1.01,11.717017364501952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,1,power_law_1.01,12.463104248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,1,power_law_1.01,13.565728759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,1,power_law_1.01,15.34361572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,1,power_law_1.01,18.001919555664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,1,power_law_1.01,22.931660461425782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,1,power_law_1.01,27.573043823242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,8,power_law_1.2,22.68733367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,1,power_law_1.01,37.02742919921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,1,power_law_1.01,48.747109985351564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,8,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,8,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,8,power_law_1.01,0.23264639377593993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,8,power_law_1.01,0.25866239070892333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,8,power_law_1.01,0.34549760818481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,8,power_law_1.01,0.3280895948410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,8,power_law_1.01,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,8,power_law_1.01,0.3590143918991089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,8,power_law_1.01,0.3606528043746948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,8,power_law_1.01,0.34816000461578367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,8,power_law_1.01,0.37109758853912356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,8,power_law_1.01,0.38908801078796384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,8,power_law_1.01,0.3831808090209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,8,power_law_1.01,0.39137279987335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,8,power_law_1.01,0.4132863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,8,power_law_1.01,0.41635842323303224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,8,power_law_1.01,0.4349952220916748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,8,power_law_1.01,0.45752320289611814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,8,power_law_1.01,0.49496960639953613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,8,power_law_1.01,0.5496831893920898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,8,power_law_1.01,0.6856512069702149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,8,power_law_1.01,0.9666560173034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,8,power_law_1.01,1.1993087768554687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,8,power_law_1.01,1.5605631828308106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,8,power_law_1.01,2.0150272369384767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,8,power_law_1.01,3.0871551513671873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,8,power_law_1.01,4.319820785522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,8,power_law_1.2,28.798770141601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,2,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,2,power_law_1.2,0.030502399802207945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,2,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,2,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,2,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,2,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,2,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,2,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,2,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,2,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,2,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,2,power_law_1.2,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,2,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,2,power_law_1.2,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,2,power_law_1.2,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,2,power_law_1.2,0.11345920562744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,2,power_law_1.2,0.15011839866638182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,2,power_law_1.2,0.19967999458312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.9076736450195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,1,power_law_1.2,1.273203182220459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,1,power_law_1.2,1.78155517578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,1,power_law_1.2,3.345612716674805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,2,power_law_1.2,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,2,power_law_1.2,0.35184640884399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,1,power_law_1.2,3.530527877807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,1,power_law_1.2,3.5342334747314452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,1,power_law_1.2,3.8340606689453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,1,power_law_1.2,4.053196716308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,1,power_law_1.2,4.231167984008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,1,power_law_1.2,4.448255920410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,2,power_law_1.2,0.4511744022369385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,32,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,32,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,32,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,32,balanced,0.06005333364009857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,32,balanced,0.20138667027155557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,32,balanced,0.20241065820058188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,32,balanced,0.20292266209920248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,32,balanced,0.20377600193023682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,32,balanced,0.20514132579167685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,1,power_law_1.2,4.25984001159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,32,balanced,0.20718934138615927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,32,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,32,balanced,0.20889600118001303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,32,balanced,0.21145600080490112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,32,balanced,0.21555199225743613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,32,balanced,0.2206719915072123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,32,balanced,0.2261120080947876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,32,balanced,0.23654399315516153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,32,balanced,0.2461013396581014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,32,balanced,0.28074665864308673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,32,balanced,0.2918399969736735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,1,power_law_1.2,4.463411331176758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,32,balanced,0.3590826590855916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,32,balanced,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,32,balanced,0.4828159809112549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,32,balanced,0.6227626800537109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,1,power_law_1.2,4.681932830810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,32,balanced,0.9292799631754557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,32,balanced,1.2165119647979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,1,power_law_1.2,5.266432189941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,2,power_law_1.2,0.7065599918365478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,1,power_law_1.2,5.813036727905273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,1,power_law_1.2,6.220595169067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,2,power_law_1.2,0.7880576133728028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,1,power_law_1.2,7.0359039306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,1,power_law_1.2,8.317337799072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,1,power_law_1.2,9.427353668212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,2,power_law_1.2,1.2447744369506837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,1,power_law_1.2,11.121049499511718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,1,power_law_1.2,12.60769271850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,2,power_law_1.2,1.9697664260864258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,1,power_law_1.2,15.796018981933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,16,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,16,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,16,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,16,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,16,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,16,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,16,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,16,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,16,power_law_1.2,0.03173120021820068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,16,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,16,power_law_1.2,0.03930239975452423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,16,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,16,power_law_1.2,0.053446400165557864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,16,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,16,power_law_1.2,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,16,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,16,power_law_1.2,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,16,power_law_1.2,0.12984319925308227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,16,power_law_1.2,0.16179200410842895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,16,power_law_1.2,0.21585919857025146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,16,power_law_1.2,0.3121151924133301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,1,power_law_1.2,19.000729370117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,16,power_law_1.2,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,16,power_law_1.2,0.6918144226074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,16,power_law_1.2,0.9494527816772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,32,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,32,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,32,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,32,balanced,0.050853331883748375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,32,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,32,balanced,0.2850133379300435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,32,balanced,0.2860373258590698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,32,balanced,0.2874026695887248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,32,balanced,0.29764266808827716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,32,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,32,balanced,0.29098665714263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,32,balanced,0.29286400477091473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,32,balanced,0.2949120004971822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,32,balanced,0.29764266808827716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,32,balanced,0.3027626673380534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,32,balanced,0.3058346708615621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,32,balanced,0.3131626645723979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,32,balanced,0.3295573393503825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,32,balanced,0.3415040175120036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,32,balanced,0.3633493185043335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,32,balanced,0.40004265308380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,32,balanced,0.4370773235956828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,32,balanced,0.5056853294372559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,32,balanced,0.6287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,32,balanced,0.7837013403574625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,1,power_law_1.2,24.68659210205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,32,balanced,1.0576213200887044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,32,balanced,1.3725013732910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,2,power_law_1.2,2.69168643951416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,16,power_law_1.2,1.4413824081420898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,1,power_law_1.2,29.6281982421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,2,power_law_1.2,3.5747840881347654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,1,power_law_1.2,40.96102294921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,16,power_law_1.2,1.7963008880615234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,8,power_law_1.01,1.622220802307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,8,power_law_1.01,2.811084747314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,8,power_law_1.01,2.56942081451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,8,power_law_1.01,3.0320640563964845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,8,power_law_1.01,3.52542724609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,8,power_law_1.01,4.030259323120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,8,power_law_1.01,3.3695743560791014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,8,power_law_1.01,3.408281707763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,8,power_law_1.01,3.6354049682617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,8,power_law_1.01,3.698252868652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,8,power_law_1.01,3.5987457275390624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,8,power_law_1.01,3.7222400665283204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,8,power_law_1.01,3.9407615661621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,8,power_law_1.01,4.038451385498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,8,power_law_1.01,4.0378368377685545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,8,power_law_1.01,4.075724792480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,8,power_law_1.01,4.119142532348633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,8,power_law_1.01,4.214374542236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,8,power_law_1.01,4.414649581909179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,8,power_law_1.01,4.833894348144531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,1,power_law_1.2,52.895947265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,8,power_law_1.01,5.2516735076904295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,8,power_law_1.01,6.318080139160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,8,power_law_1.01,6.523052978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,16,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,16,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,16,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,16,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,16,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,16,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,16,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,16,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,16,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,16,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,16,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,8,power_law_1.01,8.026290893554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,16,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,16,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,16,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,16,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,16,balanced,0.06929066777229309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,16,balanced,0.08243200182914734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,16,balanced,0.10393599669138591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,16,balanced,0.24439465999603271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,16,balanced,0.2839733362197876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,16,balanced,0.37512532869974774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,16,balanced,0.463701327641805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,16,balanced,0.679423967997233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,16,balanced,0.934229294459025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,8,power_law_1.01,9.674752044677735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,8,power_law_1.01,13.280665588378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,8,power_law_1.01,15.779840087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,256,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,256,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,256,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,256,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,256,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,256,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,256,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,256,power_law_1.2,0.040729600191116336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,256,power_law_1.2,0.04156160056591034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,256,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,256,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,256,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,256,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,256,power_law_1.2,0.04953599870204926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,256,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,256,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,256,power_law_1.2,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,256,power_law_1.2,0.10032639503479004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,256,power_law_1.2,0.13660160303115845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,256,power_law_1.2,0.17960959672927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,256,power_law_1.2,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,256,power_law_1.2,0.3874624013900757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,256,power_law_1.2,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,256,power_law_1.2,0.8988608360290528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,256,power_law_1.2,1.0590208053588868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,256,power_law_1.2,1.5241024017333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,256,power_law_1.2,2.0520959854125977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,16,balanced,0.04470400015513102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,16,balanced,0.046575998266537987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,16,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,16,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,16,balanced,0.24934399127960205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,16,balanced,0.292522668838501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,16,balanced,0.29320534070332843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,16,balanced,0.29371732473373413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,16,balanced,0.29525333642959595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,16,balanced,0.2961066762606303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,16,balanced,0.29781333605448407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,16,balanced,0.30242133140563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,16,balanced,0.30427734057108563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,16,balanced,0.3063466747601827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,16,balanced,0.31436800956726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,16,balanced,0.318122665087382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,16,balanced,0.32614399989446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,16,balanced,0.3418453137079875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,16,balanced,0.3672746817270915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,16,balanced,0.4049919843673706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,16,balanced,0.4500480095545451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,16,balanced,0.5358933210372925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,16,balanced,0.6579200029373169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,16,balanced,0.9965226650238037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,16,balanced,1.2822186946868896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,16,balanced,1.815872033437093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,16,balanced,2.3478612899780273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,2,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,2,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,2,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,2,power_law_1.2,0.21565439701080322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,2,power_law_1.2,0.2703360080718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,2,power_law_1.2,0.3512320041656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,2,power_law_1.2,0.501145601272583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,2,power_law_1.2,0.5242879867553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,2,power_law_1.2,0.5363711833953857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,2,power_law_1.2,0.5144576072692871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,2,power_law_1.2,0.5931007862091064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,2,power_law_1.2,0.6094848155975342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,2,power_law_1.2,0.5928959846496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,2,power_law_1.2,0.6449024200439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,2,power_law_1.2,0.6705152034759522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,2,power_law_1.2,0.6889472007751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,2,power_law_1.2,0.7184383869171143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,2,power_law_1.2,0.775987195968628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,2,power_law_1.2,0.7847936153411865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,2,power_law_1.2,0.9226240158081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,2,power_law_1.2,1.0297344207763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,2,power_law_1.2,1.291263961791992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,2,power_law_1.2,1.5241215705871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,2,power_law_1.2,2.1350400924682615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,2,power_law_1.2,2.5597951889038084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,2,power_law_1.2,3.711590576171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,2,power_law_1.2,4.434329605102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,4,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,4,balanced,0.03446933378775915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,4,balanced,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,4,balanced,0.4522666533788045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,4,balanced,0.45550934473673504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,4,balanced,0.45721598466237384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,4,balanced,0.45875199635823566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,4,balanced,0.4614826838175456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,4,balanced,0.46300800641377765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,4,balanced,0.466261347134908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,4,balanced,0.47121067841847736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,4,balanced,0.4734293222427368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,4,balanced,0.47940266132354736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,4,balanced,0.4891306559244792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,4,balanced,0.49544533093770343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,4,balanced,0.5106346607208252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,4,balanced,0.5410133202870687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,4,balanced,0.5495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,4,balanced,0.6176426808039347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,4,balanced,0.6579200029373169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,4,balanced,0.8185173670450846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,4,balanced,0.9854293664296468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,4,balanced,1.3834239641825359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,4,balanced,1.6984747250874836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,4,balanced,2.516138712565104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,4,balanced,3.2860161463419595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,32,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,32,power_law_1.2,0.027641600370407103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,32,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,32,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,32,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,32,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,32,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,32,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,32,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,32,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,32,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,32,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,32,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,32,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,32,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,32,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,32,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,32,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,32,power_law_1.2,0.06961920261383056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,32,power_law_1.2,0.10506240129470826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,32,power_law_1.2,0.12778240442276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,32,power_law_1.2,0.25620479583740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,32,power_law_1.2,0.3422208070755005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,32,power_law_1.2,0.5853184223175049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,32,power_law_1.2,0.7051263809204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,32,power_law_1.2,1.2797951698303223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,4,power_law_1.2,0.048518401384353635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,4,power_law_1.2,0.15174399614334105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,4,power_law_1.2,0.2076672077178955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,4,power_law_1.2,0.3346303939819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,4,power_law_1.2,0.35532801151275634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,32,balanced,0.029178666571776073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,32,balanced,0.02865600089232127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,32,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,32,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,32,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,32,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,32,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,32,balanced,0.03532266616821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,32,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,32,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,32,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,32,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,32,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,32,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,32,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,32,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,32,balanced,0.06126399834950765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,32,balanced,0.09847467144330342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,32,balanced,0.16110933820406595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,4,power_law_1.2,0.43765759468078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,32,balanced,0.21282132466634116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,32,balanced,0.2744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,4,power_law_1.2,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,32,balanced,0.31964800755182904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,32,balanced,0.4128426710764567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,4,power_law_1.2,0.550707197189331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,32,balanced,0.5434026718139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,4,power_law_1.2,0.5816319942474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,32,balanced,0.8292693297068278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,4,power_law_1.2,0.5945343971252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,4,power_law_1.2,0.611737585067749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,32,balanced,1.1106986999511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,4,power_law_1.2,0.59269118309021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,4,power_law_1.2,0.6252543926239014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,4,power_law_1.2,0.638156795501709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,4,power_law_1.2,0.6356991767883301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,4,power_law_1.2,0.667033576965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,4,power_law_1.2,0.7159808158874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,4,power_law_1.2,0.7133056163787842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,4,power_law_1.2,0.7626751899719239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,4,power_law_1.2,0.8175616264343262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,4,power_law_1.2,0.9248767852783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,4,power_law_1.2,1.0489855766296388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,4,power_law_1.2,1.308672046661377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,4,power_law_1.2,1.7856512069702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,4,power_law_1.2,2.0744192123413088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,4,power_law_1.2,2.9214719772338866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,4,power_law_1.2,3.641958236694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,32,power_law_1.2,2.1477376937866213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,2,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,2,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,2,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,2,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,2,power_law_1.01,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,2,power_law_1.01,0.20930559635162355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,2,power_law_1.01,0.22118399143218995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,2,power_law_1.01,0.22364161014556885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,2,power_law_1.01,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,2,power_law_1.01,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,2,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,2,power_law_1.01,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,2,power_law_1.01,0.2437119960784912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,2,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,2,power_law_1.01,0.26255359649658205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,2,power_law_1.01,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,2,power_law_1.01,0.29061119556427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,2,power_law_1.01,0.3079871892929077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,2,power_law_1.01,0.3221503973007202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,2,power_law_1.01,0.36577279567718507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,2,power_law_1.01,0.4050943851470947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,2,power_law_1.01,0.547603178024292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,2,power_law_1.01,0.6899712085723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,2,power_law_1.01,0.9496576309204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,2,power_law_1.01,1.3156352043151855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,2,power_law_1.01,1.966886329650879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,2,power_law_1.01,2.5403392791748045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,16,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,16,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,16,balanced,0.28228267033894855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,16,balanced,0.5435733397801717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,16,balanced,1.0567680199940999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,16,balanced,2.0667573610941568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,16,balanced,3.0772905349731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,16,balanced,3.028309186299642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,16,balanced,3.029504140218099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,16,balanced,3.0317227045694985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,16,balanced,3.0426454544067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,16,balanced,3.0453761418660483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,16,balanced,3.050837198893229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,16,balanced,3.0586878458658853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,16,balanced,3.0687573750813804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,16,balanced,3.0740480422973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,16,balanced,3.0974292755126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,8,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,8,power_law_1.2,0.12165119647979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,16,balanced,3.1493120193481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,8,power_law_1.2,0.1275904059410095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,8,power_law_1.2,0.26070399284362794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,16,balanced,3.247104008992513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,8,power_law_1.2,0.2988032102584839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,8,power_law_1.2,0.15851520299911498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,16,balanced,3.3344853719075522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,8,power_law_1.2,0.31600639820098875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,8,power_law_1.2,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,16,balanced,3.3703254063924155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,8,power_law_1.2,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,8,power_law_1.2,0.3239936113357544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,16,balanced,3.474602699279785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,8,power_law_1.2,0.3278847932815552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,8,power_law_1.2,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,8,power_law_1.2,0.341811203956604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,16,balanced,4.027733484903972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,8,power_law_1.2,0.33280000686645506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,8,power_law_1.2,0.37150719165802004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,8,power_law_1.2,0.36126079559326174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,16,balanced,4.282880147298177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,8,power_law_1.2,0.3788800001144409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,8,power_law_1.2,0.393830394744873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,8,power_law_1.2,0.421068811416626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,8,power_law_1.2,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,16,balanced,4.682239850362142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,8,power_law_1.2,0.5123968124389648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,8,power_law_1.2,0.6147776126861573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,8,power_law_1.2,0.7876224040985107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,16,balanced,5.426858901977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,8,power_law_1.2,1.0049535751342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,8,power_law_1.2,1.3420543670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,16,balanced,5.928789138793945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,8,power_law_1.2,1.8741247177124023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,8,power_law_1.2,2.5845760345458983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,2,power_law_1.2,0.40261120796203614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,2,power_law_1.2,0.6391808032989502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,2,power_law_1.2,0.9859071731567383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,2,power_law_1.2,1.4170111656188964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,2,power_law_1.2,1.9402751922607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,2,power_law_1.2,3.2495616912841796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,2,power_law_1.2,3.2817150115966798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,2,power_law_1.2,3.4699134826660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,2,power_law_1.2,3.4076671600341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,2,power_law_1.2,3.568435287475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,2,power_law_1.2,3.746815872192383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,2,power_law_1.2,3.7748481750488283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,2,power_law_1.2,3.859455871582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,2,power_law_1.2,4.026367950439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,2,power_law_1.2,4.048479843139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,2,power_law_1.2,4.191820907592773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,2,power_law_1.2,4.3927360534667965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,2,power_law_1.2,4.515225601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,2,power_law_1.2,4.640972900390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,2,power_law_1.2,5.114470291137695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,2,power_law_1.2,6.002278518676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,2,power_law_1.2,7.113318634033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,2,power_law_1.2,7.878656005859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,2,power_law_1.2,9.892249298095702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,2,power_law_1.2,11.43746566772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,2,power_law_1.2,16.17162170410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,1,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,1,power_law_1.2,0.05201280117034912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,1,power_law_1.2,0.08212479948997498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,1,power_law_1.2,0.12943359613418579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,1,power_law_1.2,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,1,power_law_1.2,0.38236160278320314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,1,power_law_1.2,0.4108287811279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,1,power_law_1.2,0.4257728099822998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,1,power_law_1.2,0.45342721939086916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,1,power_law_1.2,0.4583424091339111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,1,power_law_1.2,0.4651008129119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,1,power_law_1.2,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,1,power_law_1.2,0.49602560997009276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,1,power_law_1.2,0.518342399597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,1,power_law_1.2,0.5429247856140137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,1,power_law_1.2,0.5650432109832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,1,power_law_1.2,0.5935103893280029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,1,power_law_1.2,0.6719488143920899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,2,power_law_1.2,19.93175048828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,1,power_law_1.2,0.7600128173828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,1,power_law_1.2,0.9592831611633301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,1,power_law_1.2,1.1544575691223145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,1,power_law_1.2,1.5931391716003418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,1,power_law_1.2,1.963827133178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,128,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,128,power_law_1.01,0.029894399642944335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,128,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,1,power_law_1.2,2.7451391220092773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,128,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,128,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,128,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,128,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,128,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,128,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,128,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,128,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,128,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,128,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,128,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,128,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,128,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,128,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,128,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,128,power_law_1.01,0.07842559814453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,128,power_law_1.01,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,128,power_law_1.01,0.14499839544296264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,128,power_law_1.01,0.1992640018463135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,128,power_law_1.01,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,128,power_law_1.01,0.44400639533996583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,128,power_law_1.01,0.6295551776885986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,128,power_law_1.01,0.993894386291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,128,power_law_1.01,1.3928447723388673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,1,power_law_1.2,3.5751937866210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,1,power_law_1.2,5.333606338500976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,1,power_law_1.2,7.1067649841308596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,4,power_law_1.01,0.17059839963912965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,4,power_law_1.01,0.19292160272598266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,4,power_law_1.01,0.28037118911743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,4,power_law_1.01,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,4,power_law_1.01,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,4,power_law_1.01,0.2803263902664185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,4,power_law_1.01,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,4,power_law_1.01,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,4,power_law_1.01,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,4,power_law_1.01,0.29409279823303225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,4,power_law_1.01,0.2959359884262085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,4,power_law_1.01,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,4,power_law_1.01,0.37150719165802004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,4,power_law_1.01,0.3586047887802124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,4,power_law_1.01,0.37396481037139895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,4,power_law_1.01,0.42287359237670896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,4,power_law_1.01,0.48148479461669924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,4,power_law_1.01,0.609664011001587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,4,power_law_1.01,0.7438208103179932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,4,power_law_1.01,0.9646080017089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,4,power_law_1.01,1.1626496315002441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,4,power_law_1.01,2.098374366760254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,4,power_law_1.01,2.486476707458496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,8,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,8,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,8,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,8,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,8,power_law_1.2,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,8,power_law_1.2,0.1439743995666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,8,power_law_1.2,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,8,power_law_1.2,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,8,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,8,power_law_1.2,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,8,power_law_1.2,0.12124160528182984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,8,power_law_1.2,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,8,power_law_1.2,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,8,power_law_1.2,0.1300480008125305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,8,power_law_1.2,0.1703935980796814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,8,power_law_1.2,0.1550336003303528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,8,power_law_1.2,0.21073920726776124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,8,power_law_1.2,0.23756160736083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,8,power_law_1.2,0.2488255977630615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,8,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,8,power_law_1.2,0.3319808006286621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,8,power_law_1.2,0.4058879852294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,8,power_law_1.2,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,8,power_law_1.2,0.7401343822479248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,8,power_law_1.2,0.971776008605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,8,power_law_1.2,1.5622143745422363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,4,power_law_1.01,3.8852607727050783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,8,power_law_1.2,2.246656036376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,8,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,8,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,8,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,8,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,8,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,8,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,8,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,8,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,8,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,8,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,8,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,8,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,8,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,8,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,8,power_law_1.2,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,8,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,8,power_law_1.2,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,8,power_law_1.2,0.11549439430236816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,8,power_law_1.2,0.2234368085861206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,4,power_law_1.01,4.728217697143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,8,power_law_1.2,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,8,power_law_1.2,0.4104191780090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,8,power_law_1.2,0.5441535949707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,4,power_law_1.01,7.154483032226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,4,power_law_1.01,0.40079360008239745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,4,power_law_1.01,0.746291208267212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,4,power_law_1.01,0.7882751941680908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,4,power_law_1.01,1.0270719528198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,4,power_law_1.01,1.264230442047119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,4,power_law_1.01,1.7184768676757813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,4,power_law_1.01,1.7309503555297852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,4,power_law_1.01,1.7764352798461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,4,power_law_1.01,1.804083251953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,4,power_law_1.01,1.863065528869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,4,power_law_1.01,1.8120704650878907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,4,power_law_1.01,1.8851839065551759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,4,power_law_1.01,1.9455999374389648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,4,power_law_1.01,1.9730432510375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,4,power_law_1.01,2.0330495834350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,4,power_law_1.01,2.025267219543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,4,power_law_1.01,2.109644889831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,4,power_law_1.01,2.2597631454467773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,4,power_law_1.01,2.398412895202637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,4,power_law_1.01,2.6411008834838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,4,power_law_1.01,2.9126655578613283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,4,power_law_1.01,3.4807807922363283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,32,power_law_1.01,0.22199039459228515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,1,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,1,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,32,power_law_1.01,0.19987839460372925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,1,balanced,0.24200532833735147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,1,balanced,0.24200532833735147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,1,balanced,0.24234666426976523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,1,balanced,0.24490666389465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,32,power_law_1.01,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,1,balanced,0.24678399165471396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,1,balanced,0.24849067131678262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,32,power_law_1.01,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,1,balanced,0.2510506709416707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,1,balanced,0.25257599353790283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,1,balanced,0.2563413381576538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,32,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,1,balanced,0.2595840096473694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,1,balanced,0.26282666126887005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,4,power_law_1.01,3.8483966827392577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,1,balanced,0.27356799443562824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,32,power_law_1.01,0.13783040046691894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,1,balanced,0.2759679953257243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,1,balanced,0.2887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,1,balanced,0.29474133253097534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,32,power_law_1.01,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,1,balanced,0.32494932413101196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,1,balanced,0.37085866928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,32,power_law_1.01,0.17285120487213135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,1,balanced,0.4642133315404256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,32,power_law_1.01,0.20377600193023682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,1,balanced,0.6004053354263306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,32,power_law_1.01,0.14970240592956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,1,balanced,0.9927679697672526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,32,power_law_1.01,0.20541439056396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,8,power_law_1.2,0.8126463890075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,1,balanced,1.3591893513997395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,32,power_law_1.01,0.18309119939804078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,4,power_law_1.01,5.065727996826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,32,power_law_1.01,0.21176319122314452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,1,balanced,2.0493653615315757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,32,power_law_1.01,0.1937407970428467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,32,power_law_1.01,0.20459520816802979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,32,power_law_1.01,0.2248703956604004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,1,balanced,2.7463413874308267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,32,power_law_1.01,0.23306241035461425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,32,power_law_1.01,0.2574336051940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,32,power_law_1.01,0.26398720741271975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,1,balanced,4.120746612548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,4,power_law_1.01,6.2269439697265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,32,power_law_1.01,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,32,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,32,power_law_1.01,0.4990975856781006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,1,balanced,5.505706787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,32,power_law_1.01,0.7120895862579346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,32,power_law_1.01,1.0768383979797362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,32,power_law_1.01,1.3875200271606445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,4,power_law_1.01,9.109913635253907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,32,power_law_1.01,2.1997568130493166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,32,power_law_1.01,2.821529579162598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,4,power_law_1.01,11.221401977539063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,4,power_law_1.01,8.492646026611329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,8,power_law_1.2,1.2212224006652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,2,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,2,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,2,power_law_1.01,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,2,power_law_1.01,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,2,power_law_1.01,0.4626431941986084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,2,power_law_1.01,0.4661248207092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,2,power_law_1.01,0.47942399978637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,2,power_law_1.01,0.4767744064331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,2,power_law_1.01,0.4923391819000244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,2,power_law_1.01,0.49459199905395507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,2,power_law_1.01,0.49621119499206545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,2,power_law_1.01,0.5072896003723144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,2,power_law_1.01,0.4976640224456787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,2,power_law_1.01,0.5414912223815918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,2,power_law_1.01,0.5808127880096435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,2,power_law_1.01,0.6236159801483154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,2,power_law_1.01,0.658841609954834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,2,power_law_1.01,0.8560640335083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,2,power_law_1.01,0.9637887954711915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,2,power_law_1.01,1.1333632469177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,2,power_law_1.01,1.6986112594604492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,2,power_law_1.01,2.3595008850097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,2,power_law_1.01,2.999910354614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,2,power_law_1.01,3.905740737915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,2,power_law_1.01,5.444198226928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,8,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,8,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,8,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,8,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,8,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,8,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,8,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,8,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,8,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,8,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,8,power_law_1.01,0.047916799783706665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,8,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,8,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,8,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,8,power_law_1.01,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,8,power_law_1.01,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,8,power_law_1.01,0.08580480217933655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,8,power_law_1.01,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,8,power_law_1.01,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,8,power_law_1.01,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,8,power_law_1.01,0.3547136068344116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,8,power_law_1.01,0.49602560997009276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,8,power_law_1.01,0.6608895778656005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,8,power_law_1.01,1.0735615730285644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,8,power_law_1.01,1.4532608032226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,2,power_law_1.01,7.839743804931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,4,power_law_1.01,1.6252927780151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,4,power_law_1.01,2.8483583450317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,4,power_law_1.01,3.074457550048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,4,power_law_1.01,4.355865478515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,4,power_law_1.01,4.513177490234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,4,power_law_1.2,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,4,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,4,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,4,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,4,power_law_1.01,7.3400321960449215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,4,power_law_1.2,0.05711359977722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,4,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,4,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,4,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,4,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,4,power_law_1.2,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,4,power_law_1.01,7.218380737304687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,4,power_law_1.2,0.06858239769935608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,4,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,4,power_law_1.2,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,4,power_law_1.2,0.10382080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,4,power_law_1.2,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,4,power_law_1.2,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,4,power_law_1.2,0.20848639011383058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,4,power_law_1.01,6.775603485107422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,4,power_law_1.2,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,4,power_law_1.2,0.30658559799194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,4,power_law_1.2,0.39669759273529054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,4,power_law_1.2,0.5111807823181153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,4,power_law_1.01,7.298867034912109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,4,power_law_1.2,0.7878655910491943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,4,power_law_1.2,1.0940095901489257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,4,power_law_1.01,7.297843170166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,4,power_law_1.2,1.7520639419555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,4,power_law_1.2,2.4133632659912108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,4,power_law_1.01,7.380377960205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,4,power_law_1.2,3.704832077026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,4,power_law_1.01,7.689830780029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,4,power_law_1.2,5.185945510864258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,4,power_law_1.01,7.410073852539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,4,power_law_1.01,7.896063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,4,power_law_1.01,8.207154846191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,4,power_law_1.01,8.311603546142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,4,power_law_1.01,8.374886322021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,4,power_law_1.01,8.329011535644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,4,power_law_1.01,8.999935913085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,4,power_law_1.01,9.05011215209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,4,power_law_1.01,10.11261444091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,2,power_law_1.01,12.121702575683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,4,power_law_1.01,11.95499496459961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,4,power_law_1.01,11.979366302490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,4,power_law_1.01,15.366316223144532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,4,power_law_1.01,17.593548583984376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,64,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,64,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,64,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,64,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,64,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,64,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,64,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,64,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,64,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,64,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,64,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,64,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,64,power_law_1.01,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,64,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,4,power_law_1.01,23.862681579589843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,64,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,64,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,64,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,64,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,64,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,64,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,64,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,64,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,64,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,64,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,64,balanced,0.03225066761175791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,64,balanced,0.03276266654332479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,64,power_law_1.01,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,64,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,64,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,64,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,64,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,64,power_law_1.01,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,64,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,64,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,64,balanced,0.047775998711586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,64,power_law_1.01,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,64,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,64,balanced,0.06860266625881195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,64,power_law_1.01,0.1572864055633545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,64,balanced,0.1549493372440338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,64,balanced,0.22664533058802286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,64,power_law_1.01,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,64,balanced,0.3319466710090637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,64,power_law_1.01,0.34938879013061525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,64,balanced,0.42393600940704346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,64,power_law_1.01,0.4554751873016357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,64,balanced,0.6307839949925741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,64,power_law_1.01,0.6635519981384277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,64,balanced,0.8791039784749349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,64,power_law_1.01,1.0145792007446288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,64,power_law_1.01,1.2410880088806153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,4,power_law_1.01,27.61318359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,16,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,16,balanced,0.04486933350563049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,16,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,16,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,16,balanced,0.2954240043958028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,16,balanced,0.5504000186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,16,balanced,0.8040106296539307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,16,balanced,0.7912106513977051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,16,balanced,0.7930880387624105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,16,balanced,0.7946240107218424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,16,balanced,0.7988906701405843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,16,balanced,0.8041813373565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,16,balanced,0.8070826530456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,16,balanced,0.8161280155181885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,16,balanced,0.8261973063151041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,16,balanced,0.833184003829956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,16,balanced,0.8506027062733968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,16,balanced,0.8782506783803304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,16,balanced,0.9084586302439371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,16,balanced,0.9657866954803467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,16,balanced,1.017685333887736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,16,balanced,1.126570701599121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,16,balanced,1.218389352162679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,16,balanced,1.4629546801249187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,16,balanced,1.8013866742451985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,16,balanced,2.4244906107584634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,16,balanced,3.0219945907592773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,2,balanced,0.6420319875081381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,2,balanced,1.1219627062479656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,2,balanced,2.1804374059041343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,2,balanced,4.334591865539551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,2,balanced,8.53877321879069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,2,balanced,10.672468821207682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,2,balanced,10.690731048583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,2,balanced,10.706400553385416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,2,balanced,10.720250447591146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,2,balanced,10.724522908528646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,2,balanced,10.762752532958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,2,balanced,10.799424489339193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,2,balanced,10.832725524902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,2,balanced,10.901162465413412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,2,balanced,10.989908854166666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,2,balanced,11.394388834635416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,2,balanced,11.496944427490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,2,balanced,11.903828938802084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,2,balanced,11.984879811604818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,2,balanced,14.40017064412435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,2,balanced,13.739861806233725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,2,balanced,15.356075286865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,2,balanced,14.885716756184896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,2,balanced,18.21011225382487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,2,balanced,21.367947896321613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,2,balanced,26.91430409749349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,2,balanced,34.46357218424479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,128,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,128,power_law_1.2,0.028646400570869444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,128,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,128,power_law_1.2,0.02927359938621521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,128,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,128,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,128,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,128,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,128,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,128,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,128,power_law_1.2,0.03950720131397247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,128,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,128,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,128,power_law_1.2,0.04503040015697479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,128,power_law_1.2,0.049132800102233885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,128,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,128,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,128,power_law_1.2,0.10567679405212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,128,power_law_1.2,0.12943359613418579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,128,power_law_1.2,0.208076810836792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,128,power_law_1.2,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,128,power_law_1.2,0.454041576385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,128,power_law_1.2,0.6045695781707764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,128,power_law_1.2,0.9762816429138184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,1,balanced,0.4657493432362874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,1,balanced,0.8787626425425211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,1,balanced,1.7278292973836262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,1,balanced,3.5150505701700845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,1,balanced,6.765055974324544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,1,balanced,6.78553581237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,1,balanced,6.802944183349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,1,balanced,6.810453414916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,1,balanced,6.8283735911051435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,1,balanced,6.845610936482747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,1,balanced,6.875989278157552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,1,balanced,6.914559682210286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,1,balanced,6.942207972208659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,128,power_law_1.2,1.1958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,1,balanced,7.016618728637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,1,balanced,7.292245229085286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,1,balanced,7.352832158406575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,1,balanced,7.460522969563802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,1,balanced,7.682389577229817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,1,balanced,8.415914535522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,1,balanced,8.491690953572592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,1,balanced,8.155989329020182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,1,balanced,8.995157241821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,1,balanced,9.735509236653646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,1,balanced,11.934378306070963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,1,balanced,14.440106709798178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,1,balanced,21.087914784749348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,1,balanced,27.471872965494793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,128,power_law_1.2,1.881292724609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,128,power_law_1.2,2.4776704788208006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,1,balanced,0.07628799974918365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,1,balanced,0.30241066217422485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,1,balanced,0.5908480087916056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,1,balanced,1.1272532939910889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,1,balanced,2.206378618876139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,1,balanced,2.764629364013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,1,balanced,2.778794606526693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,1,balanced,2.7927894592285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,1,balanced,2.8030293782552085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,1,balanced,2.819242795308431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,1,balanced,2.866490681966146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,1,balanced,2.8728319803873696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,1,balanced,2.898090680440267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,1,balanced,2.9405654271443686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,1,balanced,3.000831921895345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,1,balanced,3.106815973917643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,1,balanced,3.181568145751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,1,balanced,3.3609387079874673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,1,balanced,3.550719896952311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,1,balanced,3.795285224914551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,1,balanced,4.04855473836263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,1,balanced,4.905642509460449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,1,balanced,5.789695739746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,1,balanced,7.783423741658528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,1,balanced,9.328298568725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,1,balanced,13.302783966064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,1,balanced,17.215316772460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,8,power_law_1.01,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,8,power_law_1.01,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,8,power_law_1.01,0.5332992076873779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,8,power_law_1.01,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,8,power_law_1.01,0.5089280128479003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,8,power_law_1.01,0.6354752063751221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,8,power_law_1.01,0.6516736030578614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,8,power_law_1.01,0.6475776195526123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,8,power_law_1.01,0.6508543968200684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,8,power_law_1.01,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,8,power_law_1.01,0.6512639999389649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,8,power_law_1.01,0.6823935985565186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,8,power_law_1.01,0.6959104061126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,8,power_law_1.01,0.68853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,8,power_law_1.01,0.7260159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,8,power_law_1.01,0.7565311908721923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,8,power_law_1.01,0.7337984085083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,8,power_law_1.01,0.813260841369629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,8,power_law_1.01,0.8626175880432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,8,power_law_1.01,0.9598784446716309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,8,power_law_1.01,1.1481087684631348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,8,power_law_1.01,1.4366720199584961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,8,power_law_1.01,1.8675712585449218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,8,power_law_1.01,2.384281539916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,8,power_law_1.01,3.1029184341430662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,8,power_law_1.01,4.311654281616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,8,power_law_1.01,6.0618751525878904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,4,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,4,balanced,0.03751466671625773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,4,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,4,balanced,0.15871999661127725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,4,balanced,0.3595786492029826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,4,balanced,0.6712319850921631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,4,balanced,0.6748159726460775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,4,balanced,0.6758399804433187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,4,balanced,0.6783786614735922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,4,balanced,0.6807893117268881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,4,balanced,0.6840319633483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,4,balanced,0.688981294631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,4,balanced,0.6923946539560953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,4,balanced,0.7193546295166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,4,balanced,0.7075839837392172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,4,balanced,0.7142399946848551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,4,balanced,0.7268693447113037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,4,balanced,0.7536319891611735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,4,balanced,0.7821653683980306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,4,balanced,0.8359253406524658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,4,balanced,0.8965120315551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,4,balanced,0.9854293664296468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,4,balanced,1.0912426312764485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,4,balanced,1.3375147183736165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,4,balanced,1.6040959358215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,4,balanced,2.1145599683125815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,4,balanced,2.723994572957357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,128,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,128,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,128,balanced,0.03481066723664602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,128,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,128,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,128,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,128,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,128,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,128,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,128,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,128,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,128,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,128,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,128,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,128,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,128,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,128,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,128,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,128,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,128,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,128,balanced,0.0727040022611618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,128,balanced,0.09079466263453166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,128,balanced,0.10820266604423523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,128,balanced,0.24217599630355835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,128,balanced,0.31914667288462323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,128,balanced,0.48110934098561603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,128,balanced,0.6509226560592651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,2,power_law_1.2,0.5675007820129394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,2,power_law_1.2,0.8318976402282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,2,power_law_1.2,1.4950400352478028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,2,power_law_1.2,1.6730112075805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,2,power_law_1.2,1.7586175918579101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,2,power_law_1.2,1.7725439071655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,2,power_law_1.2,1.781350326538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,2,power_law_1.2,1.7913856506347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,2,power_law_1.2,1.8571264266967773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,2,power_law_1.2,2.060697555541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,8,power_law_1.2,1.0647551536560058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,2,power_law_1.2,2.3302143096923826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,8,power_law_1.2,2.1092351913452148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,2,power_law_1.2,2.3861248016357424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,8,power_law_1.2,2.8522432327270506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,2,power_law_1.2,2.5778175354003907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,8,power_law_1.2,3.2313343048095704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,2,power_law_1.2,2.331648063659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,2,power_law_1.2,2.878463935852051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,8,power_law_1.2,4.689715194702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,2,power_law_1.2,3.0906368255615235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,8,power_law_1.2,5.440505599975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,8,power_law_1.2,5.02476806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,2,power_law_1.2,3.5565567016601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,8,power_law_1.2,6.0116737365722654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,2,power_law_1.2,4.212326431274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,8,power_law_1.2,5.168320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,8,power_law_1.2,4.732928085327148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,2,power_law_1.2,5.049343872070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,8,power_law_1.2,4.645888137817383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,8,power_law_1.2,5.011846542358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,8,power_law_1.2,4.955955123901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,8,power_law_1.2,4.949196624755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,8,power_law_1.2,5.126144027709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,2,power_law_1.2,6.818585968017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,8,power_law_1.2,5.316403198242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,8,power_law_1.2,5.308620834350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,8,power_law_1.2,5.996543884277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,8,power_law_1.2,6.129049682617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,2,power_law_1.2,7.699456024169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,8,power_law_1.2,6.519987487792969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,8,power_law_1.2,6.953369903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,8,power_law_1.2,7.538278198242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,8,power_law_1.2,8.695398712158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,8,power_law_1.2,10.288333129882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,2,power_law_1.2,11.052236938476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,2,balanced,0.4867413441340129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,2,balanced,0.9094826380411783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,2,balanced,1.7433600425720215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,2,balanced,1.7547945976257324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,2,balanced,1.7530879974365234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,2,balanced,1.7662293116251628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,64,power_law_1.2,0.5511168003082275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,2,balanced,1.7754453023274739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,256,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,64,power_law_1.2,0.5549824237823486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,2,balanced,1.7860266367594402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,256,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,2,balanced,1.7923413912455242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,256,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,8,power_law_1.2,13.689447021484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,256,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,2,balanced,1.8001920382181804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,256,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,2,balanced,1.8165760040283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,256,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,2,balanced,1.8288639386494954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,256,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,64,power_law_1.2,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,2,balanced,1.8479785919189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,256,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,2,balanced,1.9720533688863118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,256,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,64,power_law_1.2,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,256,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,2,balanced,2.012330691019694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,256,power_law_1.2,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,64,power_law_1.2,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,2,balanced,2.0317866007486978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,256,power_law_1.2,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,256,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,64,power_law_1.2,0.5419007778167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,2,balanced,2.090496063232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,256,power_law_1.2,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,256,power_law_1.2,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,64,power_law_1.2,0.5531648159027099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,256,power_law_1.2,0.11100159883499146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,2,balanced,3.5007146199544272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,64,power_law_1.2,0.496230411529541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,256,power_law_1.2,0.16650240421295165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,256,power_law_1.2,0.24576001167297362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,2,balanced,3.634858767191569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,256,power_law_1.2,0.37027840614318847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,8,power_law_1.2,19.2321533203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,256,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,2,balanced,4.743338584899902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,256,power_law_1.2,0.7233407974243165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,64,power_law_1.2,0.5109632015228271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,256,power_law_1.2,1.0545151710510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,64,power_law_1.2,0.5242688179016113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,64,power_law_1.2,0.5400576114654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,2,balanced,6.2426401774088545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,256,power_law_1.2,1.4571519851684571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,64,power_law_1.2,0.5430975914001465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,64,power_law_1.2,0.5363711833953857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,64,power_law_1.2,0.5246975898742676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,256,power_law_1.2,2.648883247375488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,64,power_law_1.2,0.586956787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,2,balanced,8.040960311889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,64,power_law_1.2,0.5744639873504639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,256,power_law_1.2,3.776716613769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,64,power_law_1.2,0.6189055919647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,64,power_law_1.2,0.6549503803253174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,8,power_law_1.2,20.014662170410155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,2,power_law_1.2,12.148326110839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,64,power_law_1.2,0.7651328086853028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,2,balanced,9.922218958536783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,64,power_law_1.2,0.9099264144897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,256,power_law_1.2,5.860351943969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,64,power_law_1.2,1.190060806274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,64,power_law_1.2,1.6558080673217774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,2,balanced,13.141845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,64,power_law_1.2,1.8548736572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,256,power_law_1.2,8.87562255859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,64,power_law_1.2,2.3910400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,64,power_law_1.2,3.236044692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,2,balanced,16.563371022542317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,2,balanced,22.9027837117513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,64,power_law_1.2,4.915180969238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,64,power_law_1.2,6.08092155456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,2,balanced,29.745152791341145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,2,power_law_1.2,18.260960388183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,2,power_law_1.2,18.572901916503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,8,power_law_1.2,0.2553855895996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,8,power_law_1.2,0.20971519947052003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,8,power_law_1.2,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,8,power_law_1.2,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,8,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,8,power_law_1.2,0.4108287811279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,8,power_law_1.2,0.42270717620849607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,8,power_law_1.2,0.4208576202392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,8,power_law_1.2,0.45608959197998045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,8,power_law_1.2,0.43089919090270995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,8,power_law_1.2,0.4607999801635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,8,power_law_1.2,0.47022080421447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,8,power_law_1.2,0.45240321159362795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,8,power_law_1.2,0.4837376117706299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,8,power_law_1.2,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,8,power_law_1.2,0.4927487850189209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,8,power_law_1.2,0.49152002334594724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,8,power_law_1.2,0.5617663860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,8,power_law_1.2,0.5916672229766846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,8,power_law_1.2,0.7589888095855712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,8,power_law_1.2,0.9168895721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,8,power_law_1.2,1.2328960418701171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,8,power_law_1.2,1.4866432189941405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,8,power_law_1.2,2.186649513244629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,8,power_law_1.2,2.857369613647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,8,power_law_1.2,3.9714622497558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,2,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,2,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,2,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,2,balanced,0.16639999548594156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,2,balanced,0.3715413411458333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,2,balanced,0.4925440152486165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,2,balanced,0.4944159984588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,2,balanced,0.4877653519312541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,2,balanced,0.4896426598230998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,2,balanced,0.4920320113499959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,2,balanced,0.49544533093770343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,2,balanced,0.4991999864578247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,2,balanced,0.502613345781962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,2,balanced,0.5077333450317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,2,balanced,0.516266663869222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,2,balanced,0.5213866631189982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,2,balanced,0.5343573490778605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,2,balanced,0.5566986799240112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,2,balanced,0.5835093259811401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,2,balanced,0.6343679825464884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,2,balanced,0.6811306476593018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,2,balanced,0.7951359748840332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,2,balanced,0.9096533457438151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,2,balanced,1.184597333272298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,2,balanced,1.473024050394694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,32,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,2,balanced,2.0473173459370932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,32,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,2,balanced,2.6641066869099936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,32,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,32,power_law_1.01,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,32,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,32,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,32,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,32,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,32,power_law_1.01,0.05795199871063232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,32,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,32,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,32,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,32,power_law_1.01,0.06775040030479432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,32,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,32,power_law_1.01,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,32,power_law_1.01,0.09317119717597962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,32,power_law_1.01,0.12062720060348511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,32,power_law_1.01,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,32,power_law_1.01,0.24801280498504638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,32,power_law_1.01,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,32,power_law_1.01,0.3280895948410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,32,power_law_1.01,0.4182015895843506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,32,power_law_1.01,0.5173247814178467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,32,power_law_1.01,0.8218624114990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,32,power_law_1.01,1.1095999717712401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,32,power_law_1.01,1.7311744689941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,32,power_law_1.01,2.1436351776123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,2,power_law_1.2,35.097601318359374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,8,power_law_1.2,5.5955455780029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,2,power_law_1.2,37.946572875976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,16,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,16,power_law_1.01,0.04627839922904968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,16,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,16,power_law_1.01,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,16,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,16,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,16,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,16,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,16,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,16,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,16,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,16,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,16,power_law_1.01,0.05180799961090088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,16,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,16,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,16,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,16,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,16,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,16,power_law_1.01,0.0886784017086029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,16,power_law_1.01,0.1486847996711731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,16,power_law_1.01,0.23224320411682128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,16,power_law_1.01,0.35983359813690186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,16,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,16,power_law_1.01,0.8112128257751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,16,power_law_1.01,1.0751999855041503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,16,power_law_1.01,1.6955392837524415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,16,power_law_1.01,2.693734359741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,64,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,64,power_law_1.2,0.21994240283966066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,64,power_law_1.2,0.21933441162109374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,64,power_law_1.2,0.21729280948638915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,64,power_law_1.2,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,64,power_law_1.2,0.1013375997543335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,64,power_law_1.2,0.14376959800720215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,64,power_law_1.2,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,64,power_law_1.2,0.11878399848937989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,64,power_law_1.2,0.1738752007484436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,64,power_law_1.2,0.16485120058059693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,64,power_law_1.2,0.19169280529022217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,64,power_law_1.2,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,64,power_law_1.2,0.16526080369949342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,64,power_law_1.2,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,64,power_law_1.2,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,64,power_law_1.2,0.24305920600891112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,64,power_law_1.2,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,64,power_law_1.2,0.2721791982650757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,64,power_law_1.2,0.33320960998535154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,64,power_law_1.2,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,64,power_law_1.2,0.47226881980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,64,power_law_1.2,0.6479551792144775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,64,power_law_1.2,1.0270719528198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,64,power_law_1.2,1.3338624000549317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,64,power_law_1.2,2.284537506103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,64,power_law_1.2,2.437939262390137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,64,balanced,0.02678400029738744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,64,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,64,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,64,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,64,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,64,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,64,balanced,0.029850666721661884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,64,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,64,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,64,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,64,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,64,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,64,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,64,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,64,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,64,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,64,balanced,0.13482667009035745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,64,balanced,0.2764799992243449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,64,balanced,0.35549867153167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,64,balanced,0.555178682009379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,64,balanced,0.7406933307647705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,16,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,16,power_law_1.01,0.027641600370407103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,16,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,16,power_law_1.01,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,16,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,16,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,16,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,16,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,16,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,16,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,16,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,16,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,16,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,16,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,16,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,16,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,16,power_law_1.01,0.08293120265007019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,16,power_law_1.01,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,16,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,16,power_law_1.01,0.45752320289611814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,16,power_law_1.01,0.7378943920135498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,16,power_law_1.01,0.9811967849731446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,16,power_law_1.01,1.499955177307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,1,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,1,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,1,power_law_1.01,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,1,power_law_1.01,0.28876800537109376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,1,power_law_1.01,0.43457279205322263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,1,power_law_1.01,0.5505023956298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,8,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,1,power_law_1.01,0.7725056171417236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,8,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,1,power_law_1.01,0.8146944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,8,power_law_1.2,0.20131840705871581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,8,power_law_1.2,0.1921023964881897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,1,power_law_1.01,0.8685567855834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,8,power_law_1.2,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,8,power_law_1.2,0.22302720546722413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,8,power_law_1.2,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,8,power_law_1.2,0.20930559635162355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,8,power_law_1.2,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,8,power_law_1.2,0.2637824058532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,8,power_law_1.2,0.2521087884902954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,8,power_law_1.2,0.25477120876312254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,1,power_law_1.01,0.8771583557128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,8,power_law_1.2,0.2510848045349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,8,power_law_1.2,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,1,power_law_1.01,0.9160703659057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,8,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,8,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,1,power_law_1.01,0.9693183898925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,8,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,8,power_law_1.2,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,1,power_law_1.01,0.9850879669189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,8,power_law_1.2,0.3315711975097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,1,power_law_1.01,1.041203212738037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,8,power_law_1.2,0.3520512104034424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,8,power_law_1.2,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,1,power_law_1.01,1.0975232124328613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,8,power_law_1.2,0.5634047985076904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,1,power_law_1.01,1.1167743682861329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,8,power_law_1.2,0.812441635131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,1,power_law_1.01,1.1884544372558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,8,power_law_1.2,0.9283583641052247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,1,power_law_1.01,1.3600768089294433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,1,power_law_1.01,1.548902416229248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,128,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,128,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,1,power_law_1.01,1.8937856674194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,128,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,8,power_law_1.2,1.6300031661987304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,128,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,128,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,128,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,1,power_law_1.01,2.246246337890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,128,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,128,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,128,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,128,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,1,power_law_1.01,2.895462417602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,128,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,128,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,128,power_law_1.01,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,128,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,128,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,128,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,1,power_law_1.01,3.5792896270751955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,128,power_law_1.01,0.09359359741210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,128,power_law_1.01,0.11038719415664673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,128,power_law_1.01,0.15748480558395386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,128,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,128,power_law_1.01,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,1,power_law_1.01,4.978688049316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,128,power_law_1.01,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,128,power_law_1.01,0.6756351947784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,128,power_law_1.01,1.1409407615661622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,8,power_law_1.2,2.166169548034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,128,power_law_1.01,1.7049600601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,128,power_law_1.01,2.4887296676635744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,1,power_law_1.01,6.421094512939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,128,power_law_1.01,3.122585678100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,1,power_law_1.01,9.335193634033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,1,power_law_1.01,12.260147094726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,16,power_law_1.2,0.03194240033626557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,16,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,16,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,16,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,16,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,16,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,16,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,16,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,16,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,16,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,16,power_law_1.2,0.031116798520088196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,16,power_law_1.2,0.03234559893608093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,16,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,16,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,16,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,16,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,16,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,16,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,16,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,16,power_law_1.2,0.07086079716682434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,16,power_law_1.2,0.09460480213165283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,16,power_law_1.2,0.23633921146392822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,16,power_law_1.2,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,16,power_law_1.2,0.4972544193267822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,16,power_law_1.2,0.7358463764190674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,16,power_law_1.2,1.3492223739624023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,16,power_law_1.2,2.0150272369384767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,4,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,4,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,4,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,4,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,4,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,4,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,4,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,1,power_law_1.2,0.40611839294433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,4,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,1,power_law_1.2,0.7591936111450195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,4,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,4,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,4,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,4,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,1,power_law_1.2,1.4510080337524414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,4,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,4,power_law_1.01,0.0894976019859314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,4,power_law_1.01,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,1,power_law_1.2,2.37891845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,1,power_law_1.2,3.1934463500976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,4,power_law_1.01,0.15400960445404052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,4,power_law_1.01,0.18083839416503905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,1,power_law_1.2,5.9969535827636715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,4,power_law_1.01,0.20889599323272706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,4,power_law_1.01,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,1,power_law_1.2,6.456729888916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,1,power_law_1.2,6.7579902648925785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,1,power_law_1.2,7.068876647949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,1,power_law_1.2,7.266304016113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,1,power_law_1.2,7.402700805664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,1,power_law_1.2,7.641683197021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,4,power_law_1.01,0.4853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,1,power_law_1.2,7.964876556396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,1,power_law_1.2,8.216371154785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,1,power_law_1.2,8.427519989013671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,4,power_law_1.01,0.8015872001647949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,1,power_law_1.2,8.697241973876952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,1,power_law_1.2,8.903065490722657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,1,power_law_1.2,9.205554962158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,4,power_law_1.01,1.264230442047119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,1,power_law_1.2,9.466060638427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,1,power_law_1.2,10.076364898681641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,1,power_law_1.2,11.49889907836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,1,power_law_1.2,13.628799438476562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,1,power_law_1.2,14.955314636230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,1,power_law_1.2,19.071385192871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,1,power_law_1.2,22.825164794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,4,power_law_1.01,1.742835235595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,1,power_law_1.2,30.943026733398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,1,power_law_1.2,38.472293090820315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,2,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,2,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,2,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,2,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,2,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,2,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,2,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,2,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,2,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,2,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,2,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,2,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,2,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,2,power_law_1.01,0.051596802473068235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,2,power_law_1.01,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,2,power_law_1.01,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,2,power_law_1.01,0.07639039754867553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,2,power_law_1.01,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,2,power_law_1.01,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,2,power_law_1.01,0.23408639430999756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,4,power_law_1.01,2.757222366333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,2,power_law_1.01,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,64,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,64,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,64,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,64,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,64,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,64,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,64,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,64,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,64,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,64,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,64,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,64,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,64,power_law_1.01,0.04790399968624115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,64,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,64,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,64,power_law_1.01,0.09748479723930359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,64,power_law_1.01,0.11857919692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,64,power_law_1.01,0.1908735990524292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,64,power_law_1.01,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,64,power_law_1.01,0.3168256044387817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,64,power_law_1.01,0.4745215892791748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,64,power_law_1.01,0.6576128005981445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,2,power_law_1.01,0.4423679828643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,64,power_law_1.01,0.7669760227203369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,2,power_law_1.01,0.5633664131164551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,2,power_law_1.01,0.9760767936706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,2,power_law_1.01,1.354751968383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,4,power_law_1.01,2.978611183166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,2,power_law_1.01,2.2562816619873045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,2,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,2,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,2,power_law_1.2,0.026412799954414368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,2,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,2,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,2,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,2,power_law_1.2,0.03808639943599701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,2,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,2,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,2,power_law_1.2,0.04032639861106872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,2,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,2,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,2,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,2,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,2,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,2,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,2,power_law_1.2,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,2,power_law_1.2,0.13127679824829103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,2,power_law_1.2,0.19415040016174318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,2,power_law_1.2,0.23633921146392822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,2,power_law_1.2,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,2,power_law_1.2,0.38236160278320314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,2,power_law_1.2,0.5203968048095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,2,power_law_1.2,0.8122367858886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,2,power_law_1.01,2.9915136337280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,2,power_law_1.2,1.148313617706299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,2,power_law_1.2,1.7319936752319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,32,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,32,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,32,balanced,0.0407679999868075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,32,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,32,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,32,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,32,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,32,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,32,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,32,balanced,0.047930667797724404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,32,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,32,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,32,balanced,0.053743998209635414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,32,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,32,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,32,balanced,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,32,balanced,0.08959999680519104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,32,balanced,0.1867093245188395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,32,balanced,0.24285866816838583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,32,balanced,0.30873600641886395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,32,balanced,0.373418649037679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,2,power_law_1.2,2.2603776931762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,32,balanced,0.539136012395223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,32,balanced,0.7309652964274088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,32,balanced,1.060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,32,balanced,1.4238559405008953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,8,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,8,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,8,power_law_1.2,0.1640447974205017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,8,power_law_1.2,0.13696639537811278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,8,power_law_1.2,0.19432320594787597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,8,power_law_1.2,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,8,power_law_1.2,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,8,power_law_1.2,0.23119359016418456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,8,power_law_1.2,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,8,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,8,power_law_1.2,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,8,power_law_1.2,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,8,power_law_1.2,0.26030080318450927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,8,power_law_1.2,0.25701758861541746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,8,power_law_1.2,0.27197439670562745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,8,power_law_1.2,0.274617600440979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,8,power_law_1.2,0.2770944118499756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,8,power_law_1.2,0.2922111988067627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,8,power_law_1.2,0.30453760623931886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,8,power_law_1.2,0.3344383955001831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,8,power_law_1.2,0.3844095945358276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,8,power_law_1.2,0.5068799972534179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,8,power_law_1.2,0.610918378829956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,8,power_law_1.2,0.8003583908081054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,8,power_law_1.2,1.219974422454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,8,power_law_1.2,1.6138240814208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,8,power_law_1.2,2.18603515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,16,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,16,balanced,0.020474666108687718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,16,balanced,0.020309332758188248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,16,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,16,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,16,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,16,balanced,0.023717333873112995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,16,balanced,0.02372266600529353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,16,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,16,balanced,0.02405333270629247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,16,balanced,0.024735999604066212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,16,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,16,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,16,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,16,balanced,0.030533333619435627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,16,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,16,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,16,balanced,0.036677333215872444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,16,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,16,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,16,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,16,balanced,0.0936959981918335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,16,balanced,0.10393599669138591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,16,balanced,0.15751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,16,balanced,0.2032639980316162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,16,balanced,0.3510613441467285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,16,balanced,0.48349865277608234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,16,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,16,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,16,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,16,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,16,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,16,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,16,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,16,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,16,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,16,power_law_1.01,0.031123200058937074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,16,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,16,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,16,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,16,power_law_1.01,0.03971199989318848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,16,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,16,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,16,power_law_1.01,0.08089600205421447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,16,power_law_1.01,0.09277439713478089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,16,power_law_1.01,0.13946880102157594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,16,power_law_1.01,0.1505280017852783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,16,power_law_1.01,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,16,power_law_1.01,0.39813120365142823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,16,power_law_1.01,0.6199295997619629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,16,power_law_1.01,0.9472000122070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,8,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,8,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,8,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,8,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,8,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,8,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,8,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,8,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,8,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,8,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,8,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,8,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,8,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,8,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,8,balanced,0.08311466872692108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,8,balanced,0.10120532910029094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,8,balanced,0.15598932902018228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,8,balanced,0.16076800227165222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,8,balanced,0.3568640152613322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,8,balanced,0.4590933322906494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,8,balanced,0.7154346307118734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,8,balanced,0.9838933149973551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,2,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,2,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,2,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,2,power_law_1.01,0.1837056040763855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,2,power_law_1.01,0.2537472009658813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,2,power_law_1.01,0.3844095945358276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,2,power_law_1.01,0.397107195854187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,2,power_law_1.01,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,2,power_law_1.01,0.42639360427856443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,2,power_law_1.01,0.4587520122528076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,2,power_law_1.01,0.46059517860412597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,2,power_law_1.01,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,2,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,2,power_law_1.01,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,2,power_law_1.01,0.48148479461669924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,2,power_law_1.01,0.5005311965942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,2,power_law_1.01,0.5177343845367431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,2,power_law_1.01,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,2,power_law_1.01,0.5830656051635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,2,power_law_1.01,0.6440959930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,2,power_law_1.01,0.7137279987335206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,2,power_law_1.01,0.9138175964355468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,2,power_law_1.01,1.0774527549743653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,1,balanced,0.31522132953008014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,1,balanced,0.5369173288345337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,2,power_law_1.01,1.4843903541564942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,1,balanced,1.0333866278330486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,1,balanced,2.023423989613851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,2,power_law_1.01,1.8006015777587892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,1,balanced,4.01527468363444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,2,power_law_1.01,2.611199951171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,1,balanced,7.9221757253011065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,2,power_law_1.01,3.2520191192626955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,1,balanced,11.853995005289713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,1,balanced,11.872938791910807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,1,balanced,11.905530293782553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,2,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,2,power_law_1.01,0.6735807895660401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,2,power_law_1.01,1.0094592094421386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,1,balanced,11.933013916015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,2,power_law_1.01,1.491551971435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,2,power_law_1.01,1.841324806213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,2,power_law_1.01,2.8522239685058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,1,balanced,11.981461842854818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,2,power_law_1.01,3.075071907043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,2,power_law_1.01,3.1272960662841798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,1,balanced,12.025685628255209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,2,power_law_1.01,3.2159744262695313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,2,power_law_1.01,3.226828765869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,2,power_law_1.01,3.3138687133789064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,1,balanced,12.067498524983725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,2,power_law_1.01,3.3697792053222657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,2,power_law_1.01,3.4043647766113283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,1,balanced,12.147883097330729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,2,power_law_1.01,3.4494464874267576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,2,power_law_1.01,3.6317184448242186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,2,power_law_1.01,3.590348815917969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,1,balanced,12.219034830729166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,2,power_law_1.01,3.602431869506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,2,power_law_1.01,3.9022590637207033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,1,balanced,12.285439809163412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,2,power_law_1.01,4.007731246948242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,2,power_law_1.01,4.607795333862304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,1,balanced,12.422645568847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,2,power_law_1.01,5.1107841491699215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,1,balanced,12.651008605957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,2,power_law_1.01,6.263808059692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,2,power_law_1.01,6.609510040283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,1,balanced,12.879530588785807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,2,power_law_1.01,8.348876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,1,balanced,13.335552215576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,2,power_law_1.01,10.390937805175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,1,balanced,13.753504435221354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,1,balanced,14.664192199707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,2,power_law_1.01,14.367948913574219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,1,balanced,15.286783854166666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,2,power_law_1.01,18.032025146484376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,1,balanced,16.997690836588543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,1,balanced,18.227711995442707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,2,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,2,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,2,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,2,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,2,power_law_1.01,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,2,power_law_1.01,0.20969600677490235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,2,power_law_1.01,0.22159359455108643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,2,power_law_1.01,0.22302720546722413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,2,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,2,power_law_1.01,0.24145920276641847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,2,power_law_1.01,0.2447360038757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,2,power_law_1.01,0.2420736074447632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,2,power_law_1.01,0.26398720741271975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,2,power_law_1.01,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,2,power_law_1.01,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,1,balanced,21.836458841959637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,2,power_law_1.01,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,2,power_law_1.01,0.3115008115768433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,2,power_law_1.01,0.3559423923492432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,2,power_law_1.01,0.3848191976547241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,2,power_law_1.01,0.4784128189086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,2,power_law_1.01,0.6440959930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,2,power_law_1.01,1.052467155456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,2,power_law_1.01,1.2197888374328614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,2,power_law_1.01,1.8687936782836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,2,power_law_1.01,2.6083328247070314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,1,balanced,26.637311299641926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,2,power_law_1.01,3.845119857788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,2,power_law_1.01,5.184511947631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,1,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,1,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,1,power_law_1.2,0.07041919827461243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,1,power_law_1.2,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,1,power_law_1.2,0.19640320539474487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,1,power_law_1.2,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,1,power_law_1.2,0.39874560832977296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,1,power_law_1.2,0.42495999336242674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,1,power_law_1.2,0.4454400062561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,1,power_law_1.2,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,1,power_law_1.2,0.49395198822021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,1,power_law_1.2,0.5251071929931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,1,power_law_1.2,0.5355519771575927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,1,power_law_1.2,0.5738495826721192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,1,power_law_1.2,0.6281216144561768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,1,power_law_1.2,0.6711296081542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,16,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,1,power_law_1.2,0.7581632137298584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,16,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,16,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,1,power_law_1.2,0.9086976051330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,16,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,16,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,1,power_law_1.2,1.0596351623535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,16,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,16,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,1,power_law_1.2,1.4118847846984863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,16,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,16,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,1,power_law_1.2,1.7604608535766602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,16,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,16,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,1,balanced,0.8953173160552979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,16,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,1,balanced,1.737727959950765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,16,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,1,power_law_1.2,2.427494430541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,16,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,16,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,1,balanced,3.4321066538492837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,16,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,16,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,1,power_law_1.2,3.0863359451293944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,1,balanced,3.6360534032185874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,16,power_law_1.2,0.08110079765319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,16,power_law_1.2,0.10424319505691529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,1,balanced,3.5519145329793296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,16,power_law_1.2,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,16,power_law_1.2,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,1,balanced,3.4841601053873696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,16,power_law_1.2,0.38543360233306884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,16,power_law_1.2,0.561356782913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,1,balanced,3.5036160151163735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,16,power_law_1.2,0.9340928077697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,1,balanced,3.523242632548014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,1,power_law_1.2,4.471807861328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,16,power_law_1.2,1.1964415550231933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,1,balanced,3.5367253621419272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,1,balanced,3.5531094868977866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,1,power_law_1.2,5.951283264160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,1,balanced,3.5790506998697915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,1,balanced,3.6113065083821616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,1,balanced,3.6439040501912436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,1,balanced,3.8725973765055337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,1,power_law_1.2,8.951398468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,1,balanced,4.310698509216309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,1,balanced,4.361898740132649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,1,balanced,4.138325373331706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,1,power_law_1.2,11.839488220214843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,1,balanced,6.831274668375651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,16,power_law_1.2,2.4606655120849608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,1,balanced,7.092048009236653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,16,power_law_1.2,2.9734912872314454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,1,balanced,8.971946716308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,1,balanced,11.169450124104818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,1,balanced,14.281386057535807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,1,balanced,17.491967519124348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,1,balanced,23.042559305826824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,1,balanced,29.648213704427082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,1,balanced,43.62751770019531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,1,balanced,58.871297200520836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.4710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.8216575622558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.9951231956481934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,1,power_law_1.01,1.731545639038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,1,power_law_1.01,1.7717248916625976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,1,power_law_1.01,1.7518592834472657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,1,power_law_1.01,1.8487104415893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,1,power_law_1.01,1.845452880859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,1,power_law_1.01,1.8493440628051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,1,power_law_1.01,1.9125951766967773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,1,power_law_1.01,1.9695615768432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,1,power_law_1.01,2.0512767791748048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,1,power_law_1.01,2.0981760025024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,1,power_law_1.01,2.2665216445922853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,1,power_law_1.01,2.386515235900879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,1,power_law_1.01,2.488934326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,1,power_law_1.01,2.7830272674560548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,1,power_law_1.01,3.1495872497558595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,1,power_law_1.01,3.4021377563476562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,1,power_law_1.01,4.1936897277832035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,1,power_law_1.01,4.858879852294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,1,power_law_1.01,6.424569702148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,1,power_law_1.01,7.860626983642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,1,power_law_1.01,10.769190216064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,1,power_law_1.01,13.879501342773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,1,power_law_1.01,19.520069885253907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,1,power_law_1.01,25.14063415527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,2,power_law_1.2,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,2,power_law_1.2,0.2902015924453735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,2,power_law_1.2,0.49008641242980955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,2,power_law_1.2,0.6936575889587402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,2,power_law_1.2,1.0500096321105956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,2,power_law_1.2,1.3821951866149902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,2,power_law_1.2,1.5038463592529296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,2,power_law_1.2,2.129715156555176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,2,power_law_1.2,2.1616384506225588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,2,power_law_1.2,2.301747131347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,2,power_law_1.2,2.31280632019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,2,power_law_1.2,2.2771711349487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,2,power_law_1.2,2.5817024230957033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,2,power_law_1.2,2.5530368804931642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,2,power_law_1.2,2.7488256454467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,2,power_law_1.2,2.6421247482299806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,2,power_law_1.2,2.9204479217529298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,2,power_law_1.2,3.0023679733276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,2,power_law_1.2,3.2917247772216798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,2,power_law_1.2,3.6167678833007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,2,power_law_1.2,3.9825408935546873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,2,power_law_1.2,4.5985664367675785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,2,power_law_1.2,4.977459335327149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,2,power_law_1.2,6.443827056884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,2,power_law_1.2,7.5329536437988285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,2,power_law_1.2,10.745849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,8,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,8,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,8,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,8,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,8,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,8,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,8,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,8,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,8,balanced,0.03429333368937174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,8,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,8,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,8,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,8,balanced,0.03719466676314672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,2,power_law_1.2,12.312576293945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,32,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,8,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,8,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,8,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,8,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,32,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,8,balanced,0.08277333279450734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,8,balanced,0.0897706647713979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,8,balanced,0.13124266266822815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,8,balanced,0.16793066263198853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,8,balanced,0.27989333868026733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,32,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,8,balanced,0.3853653271993001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,32,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,8,balanced,0.5818026860555013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,32,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,32,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,8,balanced,0.7705600261688232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,32,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,32,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,8,balanced,1.1717973550160725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,32,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,32,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,32,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,8,balanced,1.6080212593078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,32,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,32,power_law_1.01,0.044633600115776065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,32,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,32,power_law_1.01,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,32,power_law_1.01,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,32,power_law_1.01,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,32,power_law_1.01,0.1435647964477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,32,power_law_1.01,0.18472959995269775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,32,power_law_1.01,0.22380800247192384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,32,power_law_1.01,0.3784703969955444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,32,power_law_1.01,0.5392320156097412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,32,power_law_1.01,0.8632320404052735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,32,power_law_1.01,1.1331583976745605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,1,power_law_1.2,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,1,power_law_1.2,0.20459520816802979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,1,power_law_1.2,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,1,power_law_1.2,0.4483071804046631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,1,power_law_1.2,0.4651008129119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,1,power_law_1.2,0.46530561447143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,1,power_law_1.2,0.45752320289611814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,1,power_law_1.2,0.46530561447143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,1,power_law_1.2,0.49786877632141113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,1,power_law_1.2,0.46694397926330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,1,power_law_1.2,0.49295358657836913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,1,power_law_1.2,0.49930238723754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,1,power_law_1.2,0.4937727928161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,1,power_law_1.2,0.49848318099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,1,power_law_1.2,0.5261312007904053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,1,power_law_1.2,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,1,power_law_1.2,0.5967872142791748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,1,power_law_1.2,0.7151616096496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,2,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,2,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,2,power_law_1.2,0.1908735990524292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,2,power_law_1.2,0.3278847932815552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,1,power_law_1.2,0.7909311771392822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,2,power_law_1.2,0.45096960067749026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,2,power_law_1.2,0.5015552043914795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,2,power_law_1.2,0.7682047843933105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,2,power_law_1.2,0.8286208152770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,2,power_law_1.2,0.8382464408874511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,2,power_law_1.2,0.881657600402832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,2,power_law_1.2,0.8847231864929199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,2,power_law_1.2,0.9490431785583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,2,power_law_1.2,0.9500672340393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,2,power_law_1.2,0.9687040328979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,2,power_law_1.2,1.0182656288146972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,2,power_law_1.2,1.0754048347473144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,2,power_law_1.2,1.1626496315002441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,1,power_law_1.2,1.0035200119018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,2,power_law_1.2,1.277952003479004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,2,power_law_1.2,1.3692864418029784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,2,power_law_1.2,1.5886336326599122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,2,power_law_1.2,1.8333696365356444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,2,power_law_1.2,2.1999616622924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,2,power_law_1.2,2.696601676940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,2,power_law_1.2,3.7672958374023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,2,power_law_1.2,4.546355056762695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,1,power_law_1.2,1.2752896308898927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,2,power_law_1.2,6.874317169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,2,power_law_1.2,8.287641906738282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,2,power_law_1.01,0.8196096420288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,2,power_law_1.01,0.8271871566772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,2,power_law_1.01,1.4143487930297851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,1,power_law_1.2,1.7059839248657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,2,power_law_1.01,1.7577983856201171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,2,power_law_1.01,1.7561599731445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,2,power_law_1.01,1.7692672729492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,2,power_law_1.01,1.7766399383544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,2,power_law_1.01,1.7930240631103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,2,power_law_1.01,1.9056640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,2,power_law_1.01,1.965260887145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,2,power_law_1.01,2.2198272705078126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,2,power_law_1.01,2.6124288558959963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,1,power_law_1.2,2.3177215576171877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,2,power_law_1.01,2.7328512191772463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,2,power_law_1.01,2.3549951553344726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,2,power_law_1.01,2.769715118408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,2,power_law_1.01,3.021824073791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,2,power_law_1.01,3.3497089385986327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,2,power_law_1.01,4.449280166625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,2,power_law_1.01,5.338931274414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,2,power_law_1.01,7.083417510986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,2,power_law_1.01,8.090624237060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,2,power_law_1.01,10.738278198242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,1,power_law_1.2,3.3077247619628904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,2,power_law_1.01,12.069273376464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,1,power_law_1.2,4.432486343383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,2,power_law_1.01,19.05500183105469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,2,power_law_1.01,21.406719970703126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,1,power_law_1.2,6.594764709472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,4,power_law_1.01,0.2750080108642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,4,power_law_1.01,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,4,power_law_1.01,0.37560319900512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,4,power_law_1.01,0.5480447769165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,4,power_law_1.01,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,4,power_law_1.01,0.5361663818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,4,power_law_1.01,0.5441535949707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,4,power_law_1.01,0.5531648159027099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,4,power_law_1.01,0.6002687931060791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,4,power_law_1.01,0.5810175895690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,4,power_law_1.01,0.6494143962860107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,4,power_law_1.01,0.7096320152282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,4,power_law_1.01,0.7972864151000977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,2,power_law_1.01,35.58359069824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,4,power_law_1.01,0.7571455955505371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,4,power_law_1.01,0.8353792190551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,4,power_law_1.01,0.879206371307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,4,power_law_1.01,1.0092351913452149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,4,power_law_1.01,1.3639679908752442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,4,power_law_1.01,1.67956485748291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,4,power_law_1.01,2.3517183303833007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,4,power_law_1.01,2.8450815200805666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,4,power_law_1.01,3.897747039794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,4,power_law_1.01,5.024736022949218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,4,power_law_1.01,6.832947540283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,1,power_law_1.2,8.684953308105468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,2,power_law_1.01,41.11278076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,64,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,64,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,64,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,64,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,64,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,64,power_law_1.01,0.033964800834655764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,64,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,64,power_law_1.01,0.036831998825073244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,64,power_law_1.01,0.041331198811531064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,64,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,64,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,64,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,64,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,64,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,64,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,64,power_law_1.01,0.08209279775619507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,64,power_law_1.01,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,64,power_law_1.01,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,64,power_law_1.01,0.184934401512146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,64,power_law_1.01,0.29061119556427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,64,power_law_1.01,0.32170240879058837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,64,power_law_1.01,0.45711359977722166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,64,power_law_1.01,0.612556791305542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,64,power_law_1.01,1.298431968688965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,64,power_law_1.01,1.3873151779174804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,64,power_law_1.01,2.329599952697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,64,power_law_1.01,2.649087905883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,4,power_law_1.01,10.314956665039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,16,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,16,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,16,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,16,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,16,balanced,0.029861333469549816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,16,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,16,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,16,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,16,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,16,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,16,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,16,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,16,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,16,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,16,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,16,balanced,0.06894933183987935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,16,balanced,0.0890880028406779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,16,balanced,0.2070186734199524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,16,balanced,0.26436267296473187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,16,balanced,0.37905065218607586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,16,balanced,0.4891306559244792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,16,balanced,0.8031573295593262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,16,balanced,1.0705920060475667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,4,power_law_1.01,14.36549072265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,2,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,2,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,2,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,2,power_law_1.2,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,2,power_law_1.2,0.17715200185775756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,2,power_law_1.2,0.3067903995513916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,2,power_law_1.2,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,2,power_law_1.2,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,2,power_law_1.2,0.33996798992156985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,2,power_law_1.2,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,2,power_law_1.2,0.3796736001968384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,2,power_law_1.2,0.3874815940856934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,2,power_law_1.2,0.39731199741363527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,2,power_law_1.2,0.4069375991821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,2,power_law_1.2,0.4472832202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,2,power_law_1.2,0.45443201065063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,2,power_law_1.2,0.48619518280029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,2,power_law_1.2,0.558899211883545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,2,power_law_1.2,0.6000639915466308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,2,power_law_1.2,0.7729152202606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,2,power_law_1.2,0.9564160346984864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,2,power_law_1.2,1.4071807861328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,2,power_law_1.2,1.7225727081298827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,2,power_law_1.2,2.5622528076171873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,2,power_law_1.2,3.194252777099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,16,power_law_1.2,0.05198720097541809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,16,power_law_1.2,0.06675840020179749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,16,power_law_1.2,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,16,power_law_1.2,0.214630389213562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,8,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,16,power_law_1.2,0.22548480033874513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,8,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,8,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,16,power_law_1.2,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,8,power_law_1.2,0.1931264042854309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,2,power_law_1.2,4.786995315551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,16,power_law_1.2,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,8,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,8,power_law_1.2,0.23101439476013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,16,power_law_1.2,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,8,power_law_1.2,0.27156479358673097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,16,power_law_1.2,0.18145279884338378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,8,power_law_1.2,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,8,power_law_1.2,0.2303999900817871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,16,power_law_1.2,0.14069759845733643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,8,power_law_1.2,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,16,power_law_1.2,0.17998720407485963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,8,power_law_1.2,0.264192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,8,power_law_1.2,0.25722880363464357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,16,power_law_1.2,0.17100800275802613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,8,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,16,power_law_1.2,0.2095103979110718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,8,power_law_1.2,0.2732032060623169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,8,power_law_1.2,0.27402238845825194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,16,power_law_1.2,0.20273919105529786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,8,power_law_1.2,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,16,power_law_1.2,0.23633921146392822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,8,power_law_1.2,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,16,power_law_1.2,0.23982079029083253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,8,power_law_1.2,0.35635199546813967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,8,power_law_1.2,0.3540992021560669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,16,power_law_1.2,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,16,power_law_1.2,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,8,power_law_1.2,0.46387200355529784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,16,power_law_1.2,0.3250175952911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,8,power_law_1.2,0.6098944187164307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,16,power_law_1.2,0.3926016092300415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,8,power_law_1.2,0.8671232223510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,16,power_law_1.2,0.43376641273498534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,8,power_law_1.2,1.0610688209533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,8,power_law_1.2,1.7082368850708007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,16,power_law_1.2,0.5720064163208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,8,power_law_1.2,2.168832015991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,16,power_law_1.2,0.7223296165466309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,16,power_law_1.2,1.1493375778198243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,8,power_law_1.2,3.178700828552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,16,power_law_1.2,1.5042559623718261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,8,power_law_1.2,4.148428726196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,16,power_law_1.2,2.414591979980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,16,power_law_1.2,3.3064960479736327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,2,power_law_1.2,6.320127868652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,4,power_law_1.01,16.544358825683595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,16,power_law_1.01,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,16,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,16,power_law_1.01,0.02088959962129593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,16,power_law_1.01,0.020684799551963805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,16,power_law_1.01,0.02109439969062805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,16,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,16,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,16,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,16,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,16,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,16,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,16,power_law_1.01,0.029254400730133058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,16,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,16,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,16,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,16,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,16,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,16,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,16,power_law_1.01,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,16,power_law_1.01,0.08335360288619995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,16,power_law_1.01,0.10974719524383544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,16,power_law_1.01,0.12184319496154786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,16,power_law_1.01,0.20725760459899903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,16,power_law_1.01,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,16,power_law_1.01,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,16,power_law_1.01,0.7847936153411865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,4,power_law_1.2,0.3215359926223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,4,power_law_1.2,0.5498879909515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,4,power_law_1.2,0.8005632400512696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,4,power_law_1.2,1.0448896408081054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,4,power_law_1.2,1.4063615798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,4,power_law_1.2,1.7504255294799804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,4,power_law_1.2,1.8827264785766602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,4,power_law_1.2,2.4756095886230467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,4,power_law_1.2,2.3220224380493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,4,power_law_1.2,2.315059280395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,4,power_law_1.2,2.3805952072143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,4,power_law_1.2,2.472345542907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,4,power_law_1.2,2.288640022277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,4,power_law_1.2,2.6984447479248046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,4,power_law_1.2,2.5372671127319335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,4,power_law_1.2,2.5556991577148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,4,power_law_1.2,2.880102348327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,4,power_law_1.2,3.0203903198242186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,4,power_law_1.2,3.0038015365600588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,4,power_law_1.2,3.4031551361083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,4,power_law_1.2,3.583385467529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,4,power_law_1.2,3.9432193756103517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,4,power_law_1.2,4.740095901489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,4,power_law_1.2,6.019481658935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,4,power_law_1.2,7.191142272949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,4,power_law_1.2,9.175039672851563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,4,power_law_1.2,10.889830780029296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,2,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,2,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,2,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,2,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,2,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,2,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,2,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,2,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,2,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,2,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,2,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,2,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,2,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,2,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,2,balanced,0.07492266595363617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,2,balanced,0.07969066500663757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,2,balanced,0.09523199995358785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,2,balanced,0.18500266472498575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,2,balanced,0.2126506765683492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,2,balanced,0.27187200387318927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,2,balanced,0.3333066701889038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,2,balanced,0.4940799872080485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,2,balanced,0.664576013882955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,2,balanced,1.0419200261433919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,2,balanced,1.4658560752868652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,2,balanced,2.29529603322347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,2,balanced,3.1400960286458335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,32,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,32,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,32,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,32,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,32,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,32,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,32,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,32,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,32,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,32,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,32,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,32,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,32,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,32,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,32,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,32,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,32,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,32,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,32,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,32,balanced,0.067071999112765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,32,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,32,balanced,0.091648002465566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,32,balanced,0.10854400197664897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,32,balanced,0.1646933356920878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,32,balanced,0.23176532983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,32,balanced,0.3968000014623006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,32,balanced,0.514901320139567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,4,power_law_1.01,0.3201024055480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,4,power_law_1.01,0.5402624130249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,4,power_law_1.01,0.6713344097137451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,4,power_law_1.01,0.8693759918212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,4,power_law_1.01,1.1603967666625976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,4,power_law_1.01,1.3756416320800782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,4,power_law_1.01,1.7303552627563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,4,power_law_1.01,1.8192384719848633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,4,power_law_1.01,1.8929664611816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,4,power_law_1.01,1.5857664108276368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,4,power_law_1.01,1.8200576782226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,4,power_law_1.01,1.8319360733032226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,4,power_law_1.01,1.8888320922851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,4,power_law_1.01,1.871232032775879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,4,power_law_1.01,1.925119972229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,4,power_law_1.01,1.9077119827270508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,4,power_law_1.01,2.004787254333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,4,power_law_1.01,2.1405696868896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,4,power_law_1.01,2.371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,4,power_law_1.01,2.488934326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,4,power_law_1.01,2.6134527206420897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,4,power_law_1.01,3.062374305725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,4,power_law_1.01,3.5915775299072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,4,power_law_1.01,4.504371261596679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,4,power_law_1.01,5.147647857666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,4,power_law_1.01,6.944153594970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,4,power_law_1.01,8.95629425048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,4,power_law_1.2,0.577126407623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,4,power_law_1.2,1.0364928245544434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,4,power_law_1.2,1.6726015090942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,4,power_law_1.2,2.310348892211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,4,power_law_1.2,2.838528060913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,4,power_law_1.2,3.5749889373779298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,4,power_law_1.2,3.9194625854492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,4,power_law_1.2,5.174867248535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,4,power_law_1.2,4.486758422851563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,4,power_law_1.2,4.3528190612792965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,4,power_law_1.2,4.21580810546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,4,power_law_1.2,4.727193450927734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,4,power_law_1.2,4.877312088012696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,4,power_law_1.2,4.751974487304688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,4,power_law_1.2,4.904140853881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,4,power_law_1.2,5.226905441284179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,4,power_law_1.2,5.25926399230957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,4,power_law_1.2,5.841305541992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,4,power_law_1.2,5.966643142700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,4,power_law_1.2,6.316236877441407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,4,power_law_1.2,6.525746917724609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,4,power_law_1.2,7.388159942626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,4,power_law_1.2,8.362188720703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,4,power_law_1.2,10.44295654296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,4,power_law_1.2,11.705958557128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,4,power_law_1.2,15.390106201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,4,power_law_1.2,18.932325744628905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,4,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,4,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,4,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,4,balanced,0.08311466872692108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,4,balanced,0.3131733338038127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,4,balanced,0.3767999807993571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,4,balanced,0.37939198811848956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,4,balanced,0.381930669148763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,4,balanced,0.3838293155034383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,4,balanced,0.3858773310979207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,4,balanced,0.39133866628011066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,4,balanced,0.39765334129333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,4,balanced,0.4024053414662679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,4,balanced,0.4106239875157674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,4,balanced,0.4225706656773885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,4,balanced,0.4312746524810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,4,balanced,0.4478293259938558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,4,balanced,0.4882773160934448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,4,balanced,0.5277013381322225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,4,balanced,0.5847040017445883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,4,balanced,0.6580906709035238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,4,balanced,0.884394645690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,4,balanced,1.0471893151601155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,4,balanced,1.4865066210428874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,4,balanced,1.9618132909138997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,4,balanced,2.9544105529785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,4,balanced,3.9002453486124673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,64,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,64,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,64,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,64,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,64,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,64,balanced,0.2986666758855184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,64,balanced,0.4312746524810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,64,balanced,0.4242773453394572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,64,balanced,0.425983985265096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,64,balanced,0.4270079930623372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,64,balanced,0.44919466972351074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,64,balanced,0.4344906806945801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,64,balanced,0.43689600626627606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,64,balanced,0.4427093267440796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,64,balanced,0.45124268531799316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,64,balanced,0.45636268456776935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,64,balanced,0.4657493432362874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,64,balanced,0.4882773160934448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,64,balanced,0.5126826763153076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,64,balanced,0.5575679937998453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,64,balanced,0.6022826830546061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,64,balanced,0.6790826320648193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,64,balanced,0.7531359990437826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,1,balanced,0.7517546812693278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,64,balanced,0.9441280364990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,1,balanced,1.4525119463602703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,64,balanced,1.1495893001556396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,1,balanced,2.8792905807495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,64,balanced,1.5358293851216633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,1,balanced,5.658453623453776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,64,balanced,1.969322681427002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,1,balanced,11.09435780843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,1,balanced,16.240623474121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,1,balanced,16.305323282877605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,1,balanced,16.352938334147137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,1,balanced,16.40222930908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,1,balanced,16.441856384277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,1,balanced,16.532821655273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,1,balanced,16.650922139485676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,1,balanced,16.714239756266277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,1,balanced,16.84667714436849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,1,balanced,16.989354451497395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,1,balanced,17.118208567301433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,256,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,256,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,256,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,256,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,256,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,256,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,256,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,256,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,1,balanced,17.348074595133465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,256,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,256,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,256,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,256,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,256,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,256,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,256,power_law_1.2,0.07475200295448303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,256,power_law_1.2,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,256,power_law_1.2,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,256,power_law_1.2,0.1282047986984253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,256,power_law_1.2,0.16588799953460692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,1,balanced,19.50754165649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,256,power_law_1.2,0.27463679313659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,256,power_law_1.2,0.43479042053222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,256,power_law_1.2,0.6060031890869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,256,power_law_1.2,0.7467008113861084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,256,power_law_1.2,1.2011520385742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,256,power_law_1.2,1.6117759704589845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,1,balanced,18.585428873697918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,256,power_law_1.2,3.030220794677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,256,power_law_1.2,3.9370750427246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,1,balanced,21.594624837239582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,1,balanced,19.031893412272137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,1,balanced,20.59926986694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,1,balanced,22.057301839192707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,1,balanced,25.756500244140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,8,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,8,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,8,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,8,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,8,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,8,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,8,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,8,balanced,0.03992533435424169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,8,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,8,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,8,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,8,balanced,0.07884799937407176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,8,balanced,0.12441600362459819
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,8,balanced,0.23347200949986777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,8,balanced,0.3198293248812358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,8,balanced,0.47274665037790936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,1,balanced,29.105494181315105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,8,balanced,0.6582613388697306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,8,balanced,1.0801493326822917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,8,balanced,1.4935040473937988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,1,balanced,39.218859354654946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,1,balanced,47.17004903157552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,4,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,4,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,4,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,4,power_law_1.01,0.05445759892463684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,4,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,4,power_law_1.01,0.10772479772567749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,4,power_law_1.01,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,4,power_law_1.01,0.14909440279006958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,4,power_law_1.01,0.1873792052268982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,4,power_law_1.01,0.18534400463104247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,4,power_law_1.01,0.1751039981842041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,4,power_law_1.01,0.2176896095275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,4,power_law_1.01,0.21442561149597167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,4,power_law_1.01,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,4,power_law_1.01,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,4,power_law_1.01,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,4,power_law_1.01,0.2717695951461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,4,power_law_1.01,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,4,power_law_1.01,0.3452928066253662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,4,power_law_1.01,0.39034879207611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,4,power_law_1.01,0.5081088066101074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,4,power_law_1.01,0.7350272178649903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,4,power_law_1.01,0.9805824279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,4,power_law_1.01,1.5226880073547364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,4,power_law_1.01,2.0123647689819335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,4,power_law_1.01,3.305062484741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,4,power_law_1.01,4.21662712097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,2,balanced,0.0718506673971812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,2,balanced,0.2996906638145447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,2,balanced,0.5870933135350546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,2,balanced,1.121951977411906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,2,balanced,2.184874693552653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,2,balanced,2.7289600372314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,2,balanced,2.740565299987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,2,balanced,2.748415946960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,2,balanced,2.7567787170410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,2,balanced,2.7636054356892905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,2,balanced,2.780501365661621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,2,balanced,2.7975680033365884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,2,balanced,2.8158133824666343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,2,balanced,2.8453547159830728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,2,balanced,2.8803412119547525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,2,balanced,2.9789867401123047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,2,balanced,3.0351359049479165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,2,balanced,3.1351467768351235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,2,balanced,3.21996275583903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,2,balanced,3.5886081059773765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,2,balanced,3.4851840337117515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,2,balanced,3.935061454772949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,2,balanced,4.427605311075847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,2,balanced,5.50382932027181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,2,balanced,6.8742828369140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,2,balanced,9.737728118896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,2,balanced,12.6561279296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,16,power_law_1.2,0.3158015966415405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,16,power_law_1.2,0.5406720161437988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,16,power_law_1.2,0.7755775928497315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,16,power_law_1.2,0.7483391761779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,16,power_law_1.2,0.788479995727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,16,power_law_1.2,0.7999296188354492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,16,power_law_1.2,0.8040448188781738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,16,power_law_1.2,0.6748159885406494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,16,power_law_1.2,0.6543360233306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,16,power_law_1.2,0.6041408061981202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,16,power_law_1.2,0.6320064067840576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,16,power_law_1.2,0.632422399520874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,16,power_law_1.2,0.6500351905822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,16,power_law_1.2,0.6512639999389649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,16,power_law_1.2,0.662937593460083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,16,power_law_1.2,0.744652795791626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,16,power_law_1.2,0.7544832229614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,16,power_law_1.2,0.8138751983642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,16,power_law_1.2,0.8382464408874511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,16,power_law_1.2,0.9496576309204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,16,power_law_1.2,1.0778623580932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,16,power_law_1.2,1.4022656440734864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,16,power_law_1.2,1.5853568077087403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,16,power_law_1.2,2.04083194732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,16,power_law_1.2,2.700288009643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,8,power_law_1.01,0.33914880752563475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,16,power_law_1.2,3.905535888671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,8,power_law_1.01,0.5111743927001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,8,power_law_1.01,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,8,power_law_1.01,0.5287936210632325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,8,power_law_1.01,0.6469632148742676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,8,power_law_1.01,0.6260735988616943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,16,power_law_1.2,5.023328018188477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,8,power_law_1.01,0.6393856048583985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,8,power_law_1.01,0.6535168170928956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,8,power_law_1.01,0.7057216167449951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,8,power_law_1.01,0.7067327976226807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,8,power_law_1.01,0.7165952205657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,8,power_law_1.01,0.7040703773498536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,8,power_law_1.01,0.7124991893768311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,8,power_law_1.01,0.7405568122863769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,8,power_law_1.01,0.7544832229614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,8,power_law_1.01,0.7890944004058837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,8,power_law_1.01,0.7940095901489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,8,power_law_1.01,0.8185855865478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,8,power_law_1.01,0.8966143608093262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,8,power_law_1.01,1.0258432388305665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,8,power_law_1.01,1.0952704429626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,8,power_law_1.01,1.51592960357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,8,power_law_1.01,1.78155517578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,8,power_law_1.01,2.613657569885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,8,power_law_1.01,2.7000831604003905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,8,power_law_1.01,4.432281494140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,8,power_law_1.01,5.18737907409668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,32,power_law_1.01,0.1908735990524292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,32,power_law_1.01,0.19025919437408448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,32,power_law_1.01,0.19230719804763793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,32,power_law_1.01,0.19390720129013062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,32,power_law_1.01,0.12225279808044434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,32,power_law_1.01,0.08417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,32,power_law_1.01,0.11465599536895751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,32,power_law_1.01,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,32,power_law_1.01,0.13553919792175292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,32,power_law_1.01,0.11980160474777221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,32,power_law_1.01,0.13783040046691894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,32,power_law_1.01,0.14824960231781006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,32,power_law_1.01,0.16363519430160522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,32,power_law_1.01,0.15134719610214234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,32,power_law_1.01,0.13107199668884278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,32,power_law_1.01,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,32,power_law_1.01,0.16977920532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,32,power_law_1.01,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,32,power_law_1.01,0.20435841083526612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,32,power_law_1.01,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,32,power_law_1.01,0.29818880558013916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,32,power_law_1.01,0.36188158988952634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,32,power_law_1.01,0.4185984134674072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,32,power_law_1.01,0.5988351821899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,32,power_law_1.01,0.8554495811462403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,32,power_law_1.01,1.1513855934143067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,32,power_law_1.01,1.7293312072753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,16,power_law_1.2,0.03849599957466125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,16,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,16,power_law_1.2,0.040940800309181215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,16,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,16,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,16,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,16,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,16,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,16,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,16,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,16,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,16,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,16,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,16,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,16,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,16,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,16,power_law_1.2,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,16,power_law_1.2,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,16,power_law_1.2,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,16,power_law_1.2,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,16,power_law_1.2,0.19987200498580932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,16,power_law_1.2,0.2752511978149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,16,power_law_1.2,0.42330241203308105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,16,power_law_1.2,0.6418432235717774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,16,power_law_1.2,1.0065919876098632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,16,power_law_1.2,1.5400959968566894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,2,power_law_1.01,0.32460799217224123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,2,power_law_1.01,0.5746687889099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,2,power_law_1.01,0.6266880035400391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,2,power_law_1.01,1.0323967933654785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,2,power_law_1.01,1.0348480224609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,2,power_law_1.01,1.0555392265319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,2,power_law_1.01,1.0643391609191895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,2,power_law_1.01,1.1808768272399903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,2,power_law_1.01,1.2505023956298829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,2,power_law_1.01,1.3920255661010743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,2,power_law_1.01,1.255833625793457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,2,power_law_1.01,1.3238271713256835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,2,power_law_1.01,1.3256704330444335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,2,power_law_1.01,1.4292991638183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,2,power_law_1.01,1.6703424453735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,2,power_law_1.01,1.760051155090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,2,power_law_1.01,2.0523008346557616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,2,power_law_1.01,2.387148857116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,2,power_law_1.01,2.6357759475708007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,2,power_law_1.01,3.243212890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,2,power_law_1.01,3.6827136993408205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,2,power_law_1.01,4.922771072387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,2,power_law_1.01,6.532505798339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,2,power_law_1.01,7.825202941894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,2,power_law_1.01,10.773503875732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,2,power_law_1.01,13.105970764160157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,8,power_law_1.2,0.6039552211761474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,8,power_law_1.2,1.0579968452453614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,8,power_law_1.2,0.8570816040039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,8,power_law_1.2,1.2478464126586915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,8,power_law_1.2,1.4571200370788575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,8,power_law_1.2,1.7989631652832032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,8,power_law_1.2,1.7379327774047852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,4,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,4,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,8,power_law_1.2,1.7475391387939454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,4,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,4,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,8,power_law_1.2,1.9003263473510743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,4,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,4,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,8,power_law_1.2,1.6400384902954102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,4,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,4,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,8,power_law_1.2,1.7739776611328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,4,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,4,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,8,power_law_1.2,1.8368127822875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,4,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,4,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,8,power_law_1.2,1.8505727767944335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,4,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,4,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,8,power_law_1.2,1.796895980834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,4,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,4,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,4,power_law_1.2,0.07454720139503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,8,power_law_1.2,1.9906303405761718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,4,power_law_1.2,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,4,power_law_1.2,0.10588159561157226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,8,power_law_1.2,2.023423957824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,8,power_law_1.01,0.5578752040863038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,4,power_law_1.2,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,8,power_law_1.01,1.0364928245544434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,4,power_law_1.2,0.25395200252532957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,8,power_law_1.2,2.191564750671387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,4,power_law_1.2,0.33320960998535154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,4,power_law_1.2,0.4114431858062744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,8,power_law_1.01,2.0160512924194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,8,power_law_1.2,2.159404754638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,4,power_law_1.2,0.6699007987976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,8,power_law_1.01,1.7336320877075195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,8,power_law_1.2,2.329599952697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,4,power_law_1.2,0.9246720314025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,2,power_law_1.01,20.236697387695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,8,power_law_1.01,2.246860885620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,8,power_law_1.2,2.4971263885498045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,4,power_law_1.2,1.7485824584960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,8,power_law_1.01,2.593177604675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,8,power_law_1.2,2.6957759857177734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,4,power_law_1.2,2.34332160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,8,power_law_1.01,2.720358467102051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,8,power_law_1.2,3.2129024505615233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,8,power_law_1.01,2.588262367248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,8,power_law_1.2,4.001792144775391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,8,power_law_1.01,2.7897855758666994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,8,power_law_1.01,2.34085750579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,8,power_law_1.2,5.599635314941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,8,power_law_1.01,2.522316741943359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,8,power_law_1.01,2.253414344787598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,8,power_law_1.2,5.532672119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,8,power_law_1.01,2.6894336700439454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,8,power_law_1.01,2.45166072845459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,8,power_law_1.2,8.441651153564454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,8,power_law_1.01,2.870681571960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,8,power_law_1.01,2.7027456283569338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,8,power_law_1.01,2.7252735137939452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,8,power_law_1.2,10.456249237060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,8,power_law_1.01,2.708684730529785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,8,power_law_1.01,2.9925376892089846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,8,power_law_1.01,3.1019008636474608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,8,power_law_1.01,3.2182273864746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,8,power_law_1.01,3.5495937347412108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,8,power_law_1.01,4.032102584838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,8,power_law_1.01,4.968243026733399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,8,power_law_1.01,6.157926559448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,8,power_law_1.01,8.214527893066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,8,power_law_1.01,9.531391906738282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,64,balanced,0.06502399841944377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,64,balanced,0.05649066468079885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,64,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,64,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,64,balanced,0.28962133328119916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,64,balanced,0.5486933390299479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,64,balanced,0.8091306686401367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,64,balanced,0.8069120248158773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,64,balanced,0.8084479967753092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,64,balanced,0.8096373081207275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,64,balanced,0.8034986654917399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,64,balanced,0.8084479967753092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,64,balanced,0.8098133405049642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,64,balanced,0.8162986437479655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,64,balanced,0.8229546546936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,64,balanced,0.8256853421529134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,64,balanced,0.8343893686930338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,64,balanced,0.8500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,64,balanced,0.8710827032725016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,64,balanced,0.8989013036092123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,64,balanced,0.9391787052154541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,64,balanced,0.9968640009562174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,64,balanced,1.1380053361256917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,64,balanced,1.313962697982788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,64,balanced,1.5250773429870605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,64,balanced,1.7551360130310059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,64,balanced,2.077184041341146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,1,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,1,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,1,power_law_1.01,0.18408960103988647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,1,power_law_1.01,0.3282815933227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,1,power_law_1.01,0.43765759468078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,1,power_law_1.01,0.721504020690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,1,power_law_1.01,0.7573503971099853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,1,power_law_1.01,0.8220671653747559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,1,power_law_1.01,0.8171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,1,power_law_1.01,0.8568832397460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,1,power_law_1.01,0.8728575706481934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,1,power_law_1.01,0.8992768287658691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,1,power_law_1.01,0.9127936363220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,1,power_law_1.01,0.9504768371582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,1,power_law_1.01,0.94268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,1,power_law_1.01,0.9797632217407226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,1,power_law_1.01,1.0078207969665527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,1,power_law_1.01,1.0743424415588378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,1,power_law_1.01,1.1323391914367675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,1,power_law_1.01,1.255628776550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,1,power_law_1.01,1.4159808158874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,1,power_law_1.01,1.7235967636108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,1,power_law_1.01,1.96362247467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,1,power_law_1.01,2.6503168106079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,1,power_law_1.01,3.0914560317993165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,1,power_law_1.01,4.301414489746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,1,power_law_1.01,5.3393409729003904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,4,power_law_1.01,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,4,power_law_1.01,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,4,power_law_1.01,0.19927040338516236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,4,power_law_1.01,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,4,power_law_1.01,0.24574079513549804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,4,power_law_1.01,0.24801280498504638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,4,power_law_1.01,0.2521087884902954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,4,power_law_1.01,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,4,power_law_1.01,0.2629568099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,4,power_law_1.01,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,4,power_law_1.01,0.2930624008178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,4,power_law_1.01,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,4,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,4,power_law_1.01,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,4,power_law_1.01,0.34406399726867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,4,power_law_1.01,0.3354624032974243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,4,power_law_1.01,0.3708928108215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,4,power_law_1.01,0.4937727928161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,4,power_law_1.01,0.5842944145202636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,4,power_law_1.01,0.8705920219421387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,4,power_law_1.01,1.132748794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,4,power_law_1.01,1.536409568786621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,4,power_law_1.01,2.324070358276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,4,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,4,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,4,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,4,power_law_1.2,0.030073601007461547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,4,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,4,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,4,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,4,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,4,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,4,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,4,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,4,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,4,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,4,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,4,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,4,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,4,power_law_1.2,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,4,power_law_1.2,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,4,power_law_1.2,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,4,power_law_1.01,2.8321792602539064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,4,power_law_1.2,0.2793215990066528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,4,power_law_1.2,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,4,power_law_1.2,0.5922815799713135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,4,power_law_1.2,0.9848832130432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,4,power_law_1.01,3.951001739501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,4,power_law_1.2,1.397555160522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,4,power_law_1.2,2.046342468261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,32,power_law_1.2,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,4,power_law_1.01,5.58653450012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,32,power_law_1.2,0.2924544095993042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,32,power_law_1.2,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,32,power_law_1.2,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,32,power_law_1.2,0.26972160339355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,32,power_law_1.2,0.265011191368103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,32,power_law_1.2,0.255180811882019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,32,power_law_1.2,0.2537472009658813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,32,power_law_1.2,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,32,power_law_1.2,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,32,power_law_1.2,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,32,power_law_1.2,0.2875391960144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,32,power_law_1.2,0.28917760848999025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,32,power_law_1.2,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,32,power_law_1.2,0.319488000869751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,32,power_law_1.2,0.3184639930725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,32,power_law_1.2,0.3028991937637329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,32,power_law_1.2,0.3495935916900635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,32,power_law_1.2,0.37867519855499265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,32,power_law_1.2,0.4415487766265869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,32,power_law_1.2,0.5066751956939697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,32,power_law_1.2,0.6840320110321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,4,power_law_1.2,2.8499967575073244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,32,power_law_1.2,1.0674176216125488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,32,power_law_1.2,1.500979232788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,32,power_law_1.2,1.7252351760864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,32,power_law_1.2,2.8082176208496095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,32,power_law_1.2,4.153753662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,32,power_law_1.01,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,32,power_law_1.01,0.2017280101776123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,32,power_law_1.01,0.20336639881134033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,32,power_law_1.01,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,32,power_law_1.01,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,32,power_law_1.01,0.17448960542678832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,32,power_law_1.01,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,32,power_law_1.01,0.11263999938964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,32,power_law_1.01,0.21299200057983397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,32,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,32,power_law_1.01,0.19517439603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,32,power_law_1.01,0.21954560279846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,32,power_law_1.01,0.2213887929916382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,32,power_law_1.01,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,32,power_law_1.01,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,32,power_law_1.01,0.22917120456695556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,32,power_law_1.01,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,32,power_law_1.01,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,32,power_law_1.01,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,32,power_law_1.01,0.3645440101623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,32,power_law_1.01,0.4317183971405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,32,power_law_1.01,0.5611455917358399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,32,power_law_1.01,0.7964672088623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,32,power_law_1.01,1.1225088119506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,32,power_law_1.01,1.5943679809570312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,32,power_law_1.01,2.2149120330810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,32,power_law_1.01,3.022233581542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,4,power_law_1.01,7.453286743164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,4,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,4,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,4,balanced,0.31112533807754517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,4,balanced,0.5910186767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,4,balanced,1.1221226851145427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,4,balanced,1.3888853391011555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,4,balanced,1.3941760063171387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,4,balanced,1.4008320172627766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,4,balanced,1.405610720316569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,4,balanced,1.4091946283976238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,4,balanced,1.4163626035054524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,4,balanced,1.4240427017211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,4,balanced,1.4308692614237468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,4,balanced,1.4453760782877605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,4,balanced,1.462272008260091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,4,balanced,1.5112533569335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,4,balanced,1.53275728225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,4,balanced,1.6040959358215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,4,balanced,1.6421546936035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,4,balanced,1.754111925760905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,4,balanced,1.7943785985310872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,1,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,1,balanced,0.08191999793052673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,4,balanced,2.053290685017904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,1,balanced,0.3056640028953552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,1,balanced,0.5915253162384033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,1,balanced,1.128618637720744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,4,balanced,2.3065600395202637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,1,balanced,1.4091946283976238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,1,balanced,1.4185813268025715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,4,balanced,2.8695894877115884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,1,balanced,1.4293333689371746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,1,balanced,1.4448639551798503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,1,balanced,1.4552747408548992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,4,balanced,3.602773348490397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,1,balanced,1.4810400009155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,1,balanced,1.5013440450032551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,1,balanced,1.5245653788248699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,1,balanced,1.5656852722167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,4,balanced,5.099856058756511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,1,balanced,1.6018773714701335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,1,balanced,1.6407893498738606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,1,balanced,1.723050594329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,1,balanced,1.8483200073242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,4,balanced,6.6889387766520185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,1,balanced,2.018474737803141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,1,balanced,2.368000030517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,1,balanced,2.689706802368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,1,balanced,3.5065174102783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,1,balanced,4.323840141296387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,1,balanced,5.968896230061849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,1,balanced,7.667370478312175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,1,balanced,10.944341023763021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,1,balanced,14.165674845377604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,1,balanced,0.5140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,1,balanced,0.8971947034200033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,1,balanced,1.7614506085713704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,1,balanced,1.73909330368042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,1,balanced,1.7774933179219563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,1,balanced,1.7532587051391602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,1,balanced,1.7648639678955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,1,balanced,1.7783466974894206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,1,balanced,1.7892692883809407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,1,balanced,1.795072078704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,1,balanced,1.8177706400553386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,1,balanced,1.840453306833903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,1,balanced,1.8546346028645833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,1,balanced,1.96725861231486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,1,balanced,2.008234659830729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,1,balanced,2.0329813957214355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,1,balanced,2.1358933448791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,1,balanced,2.739370663960775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,1,balanced,2.947413444519043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,1,balanced,3.6925439834594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,1,balanced,4.3116960525512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,1,balanced,5.924181620279948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,1,balanced,7.313045501708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,1,balanced,10.559130350748697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,1,balanced,13.996031443277994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,1,balanced,20.84334945678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,1,balanced,27.84119415283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,8,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,8,power_law_1.01,0.16977920532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,8,power_law_1.01,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,8,power_law_1.01,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,8,power_law_1.01,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,8,power_law_1.01,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,8,power_law_1.01,0.32604160308837893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,8,power_law_1.01,0.3123136043548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,8,power_law_1.01,0.29859840869903564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,8,power_law_1.01,0.30945279598236086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,8,power_law_1.01,0.33505280017852784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,8,power_law_1.01,0.32870399951934814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,8,power_law_1.01,0.3201024055480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,8,power_law_1.01,0.3487744092941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,8,power_law_1.01,0.3520512104034424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,8,power_law_1.01,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,8,power_law_1.01,0.37150719165802004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,8,power_law_1.01,0.3932159900665283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,8,power_law_1.01,0.39935998916625975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,8,power_law_1.01,0.4497407913208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,8,power_law_1.01,0.49930238723754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,8,power_law_1.01,0.5746687889099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,8,power_law_1.01,0.6504447937011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,8,power_law_1.01,0.8960000038146972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,8,power_law_1.01,1.2064767837524415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,8,power_law_1.01,1.7692672729492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,8,power_law_1.01,2.062335968017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,2,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,2,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,2,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,2,balanced,0.24473067124684653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,2,balanced,0.4538026650746663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,2,balanced,0.45670398076375324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,2,balanced,0.4585813283920288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,2,balanced,0.4608000119527181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,2,balanced,0.46353065967559814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,2,balanced,0.4647253354390462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,2,balanced,0.46199464797973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,2,balanced,0.4652373393376668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,2,balanced,0.4694986740748088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,2,balanced,0.48213334878285724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,2,balanced,0.4904959996541341
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,2,balanced,0.49851731459299725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,2,balanced,0.5092693169911703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,2,balanced,0.5399893522262573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,2,balanced,0.5645493268966675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,2,balanced,0.6220479806264242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,2,balanced,0.6797653039296468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,2,balanced,0.8287573655446371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,2,balanced,0.9697279930114746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,2,balanced,1.2535466353098552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,2,balanced,1.5982666015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,2,balanced,2.224298636118571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,2,balanced,2.976597468058268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,1,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,1,power_law_1.2,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,1,power_law_1.2,0.40673279762268066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,1,power_law_1.2,0.5908480167388916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,1,power_law_1.2,0.789299201965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,1,power_law_1.2,1.4516223907470702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,1,power_law_1.2,1.5040512084960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,1,power_law_1.2,1.5749119758605956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,1,power_law_1.2,1.621401596069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,1,power_law_1.2,1.6517120361328126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,1,power_law_1.2,1.7055744171142577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,1,power_law_1.2,1.7508352279663086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,1,power_law_1.2,1.7573888778686524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,1,power_law_1.2,1.7797119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,1,power_law_1.2,1.802854347229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,1,power_law_1.2,1.8575359344482423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,1,power_law_1.2,1.8585599899291991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,1,power_law_1.2,1.939244842529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,1,power_law_1.2,2.0707328796386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,1,power_law_1.2,2.3154687881469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,1,power_law_1.2,2.5530368804931642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,1,power_law_1.2,3.115827178955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,1,power_law_1.2,3.380633544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,16,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,16,power_law_1.2,0.2869247913360596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,16,power_law_1.2,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,16,power_law_1.2,0.39894399642944334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,16,power_law_1.2,0.411846399307251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,16,power_law_1.2,0.35184640884399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,1,power_law_1.2,4.360601425170898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,16,power_law_1.2,0.33873920440673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,16,power_law_1.2,0.3176448106765747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,16,power_law_1.2,0.3442431926727295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,16,power_law_1.2,0.35880959033966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,16,power_law_1.2,0.3631103992462158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,16,power_law_1.2,0.37068800926208495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,16,power_law_1.2,0.34037759304046633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,16,power_law_1.2,0.3852288007736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,16,power_law_1.2,0.406112003326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,16,power_law_1.2,0.4079616069793701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,16,power_law_1.2,0.38540799617767335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,16,power_law_1.2,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,16,power_law_1.2,0.4972544193267822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,16,power_law_1.2,0.5285888195037842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,16,power_law_1.2,0.5935103893280029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,16,power_law_1.2,0.7854080200195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,16,power_law_1.2,0.9566207885742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,16,power_law_1.2,1.3291520118713378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,16,power_law_1.2,1.8309120178222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,1,power_law_1.2,5.418803024291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,16,power_law_1.2,2.6802175521850584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,16,power_law_1.2,3.8758399963378904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,4,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,4,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,4,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,4,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,4,power_law_1.2,0.03234559893608093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,4,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,4,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,4,power_law_1.2,0.0358271986246109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,4,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,4,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,4,power_law_1.2,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,4,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,4,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,4,power_law_1.2,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,64,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,64,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,4,power_law_1.2,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,64,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,64,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,4,power_law_1.2,0.09646080136299133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,64,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,4,power_law_1.2,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,64,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,64,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,64,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,64,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,64,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,64,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,64,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,64,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,64,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,4,power_law_1.2,0.11816960573196411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,64,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,64,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,64,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,64,power_law_1.2,0.09400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,64,power_law_1.2,0.11448320150375366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,64,power_law_1.2,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,64,power_law_1.2,0.18780159950256348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,64,power_law_1.2,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,64,power_law_1.2,0.3078144073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,64,power_law_1.2,0.6121471881866455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,4,power_law_1.2,0.14991359710693358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,64,power_law_1.2,0.9654144287109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,64,power_law_1.2,1.4940159797668457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,64,power_law_1.2,2.002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,4,power_law_1.2,0.22036480903625488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,1,power_law_1.2,7.655814361572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,4,power_law_1.2,0.3569664001464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,4,power_law_1.2,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,32,power_law_1.01,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,32,power_law_1.01,0.35532801151275634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,32,power_law_1.01,0.3547136068344116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,32,power_law_1.01,0.3543040037155151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,32,power_law_1.01,0.3330048084259033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,32,power_law_1.01,0.34856960773468015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,32,power_law_1.01,0.341811203956604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,32,power_law_1.01,0.32829439640045166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,32,power_law_1.01,0.3157952070236206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,32,power_law_1.01,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,32,power_law_1.01,0.35880959033966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,4,power_law_1.2,0.6547455787658691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,32,power_law_1.01,0.35184640884399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,1,power_law_1.2,9.77776641845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,32,power_law_1.01,0.3565567970275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,32,power_law_1.01,0.34447360038757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,32,power_law_1.01,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,32,power_law_1.01,0.3649535894393921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,32,power_law_1.01,0.3858432054519653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,32,power_law_1.01,0.37703680992126465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,32,power_law_1.01,0.3831808090209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,32,power_law_1.01,0.4229119777679443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,32,power_law_1.01,0.5111807823181153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,32,power_law_1.01,0.6078464031219483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,32,power_law_1.01,0.7415808200836181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,32,power_law_1.01,1.064345645904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,32,power_law_1.01,1.2423168182373048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,32,power_law_1.01,1.8782207489013671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,32,power_law_1.01,2.3179264068603516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,4,power_law_1.2,1.0100735664367675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,4,power_law_1.2,1.4655488014221192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,2,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,2,balanced,0.09130666653315227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,2,balanced,0.3022506634394328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,2,balanced,0.589141329129537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,2,balanced,1.130837361017863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,2,balanced,1.4031999905904133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,2,balanced,1.4097065925598145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,2,balanced,1.4182400703430176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,2,balanced,1.423701286315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,2,balanced,1.4291626612345378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,2,balanced,1.443669319152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,2,balanced,1.4523733456929524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,2,balanced,1.470629374186198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,2,balanced,1.4982825915018718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,2,balanced,1.5168852806091309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,2,balanced,1.5697919527689617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,2,balanced,1.6155093510945637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,2,balanced,1.6943786938985188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,2,balanced,1.7935360272725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,2,balanced,1.9131733576456706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,2,balanced,2.085205396016439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,2,balanced,2.509141286214193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,2,balanced,2.960895856221517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,2,balanced,4.058112144470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,2,balanced,4.815183957417806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,2,balanced,6.842026392618815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,2,balanced,8.867328008015951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,4,power_law_1.2,2.60894718170166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,4,power_law_1.2,3.261439895629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,16,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,16,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,16,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,16,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,16,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,16,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,16,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,16,power_law_1.2,0.05815039873123169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,16,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,16,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,16,power_law_1.2,0.06305279731750488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,16,power_law_1.2,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,16,power_law_1.2,0.0686016023159027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,16,power_law_1.2,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,16,power_law_1.2,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,16,power_law_1.2,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,16,power_law_1.2,0.1183743953704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,16,power_law_1.2,0.18186240196228026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,16,power_law_1.2,0.24227840900421144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,16,power_law_1.2,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,16,power_law_1.2,0.5324416160583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,16,power_law_1.2,0.589414405822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,16,power_law_1.2,1.0450943946838378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,16,power_law_1.2,1.4237695693969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,16,power_law_1.2,2.4369152069091795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,16,power_law_1.2,3.194060707092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,8,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,8,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,8,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,8,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,8,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,8,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,8,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,8,power_law_1.01,0.03235200047492981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,8,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,8,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,8,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,8,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,8,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,8,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,8,power_law_1.01,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,8,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,8,power_law_1.01,0.25292799472808836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,8,power_law_1.01,0.33566720485687257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,8,power_law_1.01,0.5238783836364747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,8,power_law_1.01,0.8359935760498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,8,power_law_1.01,1.4729215621948242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,8,power_law_1.01,1.9353471755981446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,1,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,1,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,1,power_law_1.2,0.28998401165008547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,1,power_law_1.2,0.4933631896972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,1,power_law_1.2,0.6952960014343261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,1,power_law_1.2,0.9353216171264649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,1,power_law_1.2,1.4352383613586426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,1,power_law_1.2,1.5286272048950196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,1,power_law_1.2,1.6287744522094727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,1,power_law_1.2,1.6035839080810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,1,power_law_1.2,1.7053695678710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,1,power_law_1.2,1.8251775741577148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,1,power_law_1.2,1.8515968322753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,1,power_law_1.2,1.8954240798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,1,power_law_1.2,2.0189184188842773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,1,power_law_1.2,2.047590446472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,1,power_law_1.2,2.185817527770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,1,power_law_1.2,2.3830528259277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,1,power_law_1.2,2.5972736358642576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,1,power_law_1.2,2.9661184310913087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,1,power_law_1.2,3.4072574615478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,1,power_law_1.2,4.0796161651611325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,1,power_law_1.2,4.851507186889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,1,power_law_1.2,6.3920127868652346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,1,power_law_1.2,7.668729400634765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,1,power_law_1.2,10.794802856445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,1,power_law_1.2,13.982310485839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,1,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,1,power_law_1.01,0.18472959995269775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,1,power_law_1.01,0.36229119300842283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,32,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,1,power_law_1.01,0.5988351821899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,32,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,1,power_law_1.01,0.8669183731079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,32,power_law_1.01,0.031327998638153075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,32,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,32,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,32,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,32,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,32,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,32,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,32,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,1,power_law_1.01,1.4196736335754394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,1,power_law_1.01,1.545625591278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,1,power_law_1.01,1.5945728302001954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,32,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,1,power_law_1.01,1.6310272216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,32,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,32,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,1,power_law_1.01,1.680384063720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,32,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,32,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,32,power_law_1.01,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,1,power_law_1.01,1.7108991622924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,32,power_law_1.01,0.09441279768943786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,32,power_law_1.01,0.10649600028991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,32,power_law_1.01,0.1464319944381714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,1,power_law_1.01,1.7776639938354493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,32,power_law_1.01,0.19701759815216063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,32,power_law_1.01,0.2715456008911133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,1,power_law_1.01,1.7801216125488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,32,power_law_1.01,0.34816000461578367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,1,power_law_1.01,1.7917951583862304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,32,power_law_1.01,0.6002687931060791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,32,power_law_1.01,0.7192575931549072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,1,power_law_1.01,1.8585599899291991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,32,power_law_1.01,1.1823103904724122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,1,power_law_1.01,1.8884607315063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,1,power_law_1.01,1.9288063049316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,32,power_law_1.01,1.4692352294921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,1,power_law_1.01,1.9908607482910157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,1,power_law_1.01,2.068889617919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,1,power_law_1.01,2.2812671661376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,1,power_law_1.01,2.439571189880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,1,power_law_1.01,2.9028160095214846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,1,power_law_1.01,3.141836738586426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,1,power_law_1.01,3.992166519165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,1,power_law_1.01,4.673126220703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,1,power_law_1.01,6.451200103759765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,1,power_law_1.01,8.024063873291016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,1,balanced,0.25651200612386066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,1,balanced,0.45260798931121826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,1,balanced,0.8753493626912435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,1,balanced,1.7165652910868328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,1,balanced,3.3926827112833657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,1,balanced,3.4384212493896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,1,balanced,3.4554878870646157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,1,balanced,3.446613311767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,1,balanced,3.4583892822265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,1,balanced,3.474090576171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,1,balanced,3.525631904602051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,1,balanced,3.527338663736979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,1,balanced,3.548330624898275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,1,balanced,3.5857067108154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,1,balanced,3.631429354349772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,1,balanced,3.6700159708658853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,1,balanced,3.755690574645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,1,balanced,3.923797289530436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,1,balanced,4.105386734008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,1,balanced,4.4945065180460615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,1,balanced,4.7687679926554365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,1,balanced,5.018111864725749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,1,balanced,5.605536142985026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,1,balanced,7.160661061604817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,1,balanced,8.772607803344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,1,balanced,12.902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,1,balanced,17.246891021728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,32,balanced,0.047594666481018066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,32,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,32,balanced,0.04827733337879181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,32,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,32,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,32,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,32,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,32,balanced,0.056320001681645714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,32,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,32,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,32,balanced,0.05973333120346069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,32,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,32,balanced,0.06193066636721293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,32,balanced,0.06604800124963124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,32,balanced,0.06741333504517873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,32,balanced,0.08121066788832347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,32,balanced,0.1088800032933553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,32,balanced,0.14967466394106546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,32,balanced,0.2515626748402913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,32,balanced,0.29661866029103595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,32,balanced,0.36693334579467773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,32,balanced,0.4551626841227214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,32,balanced,0.6502399841944376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,32,balanced,0.8820052941640218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,32,balanced,1.2909226417541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,32,balanced,1.7087146441141765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,64,power_law_1.01,0.29409279823303225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,64,power_law_1.01,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,64,power_law_1.01,0.2985856056213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,64,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,64,power_law_1.01,0.23695359230041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,64,power_law_1.01,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,64,power_law_1.01,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,64,power_law_1.01,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,64,power_law_1.01,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,64,power_law_1.01,0.2934783935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,64,power_law_1.01,0.29614078998565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,64,power_law_1.01,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,64,power_law_1.01,0.2934783935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,64,power_law_1.01,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,64,power_law_1.01,0.32766079902648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,64,power_law_1.01,0.3192575931549072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,64,power_law_1.01,0.3378943920135498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,64,power_law_1.01,0.3375103950500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,64,power_law_1.01,0.3831808090209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,64,power_law_1.01,0.4413440227508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,64,power_law_1.01,0.5009088039398193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,64,power_law_1.01,0.6758399963378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,64,power_law_1.01,0.78438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,64,power_law_1.01,1.1718655586242677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,64,power_law_1.01,1.5867903709411622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,64,power_law_1.01,2.468454360961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,64,power_law_1.01,3.3366016387939452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,128,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,128,power_law_1.01,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,128,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,128,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,128,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,128,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,128,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,128,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,128,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,128,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,128,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,128,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,128,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,128,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,128,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,128,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,128,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,128,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,128,power_law_1.01,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,128,power_law_1.01,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,128,power_law_1.01,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,128,power_law_1.01,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,128,power_law_1.01,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,128,power_law_1.01,0.3780607938766479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,128,power_law_1.01,0.531660795211792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,128,power_law_1.01,0.8646656036376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,128,power_law_1.01,1.2011520385742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,8,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,8,balanced,0.02643733223279317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,8,balanced,0.027461332579453785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,8,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,8,balanced,0.19336533546447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,8,balanced,0.25651200612386066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,8,balanced,0.2573653260866801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,8,balanced,0.25787200530370075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,8,balanced,0.258730669816335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,8,balanced,0.2616320053736369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,8,balanced,0.2614506681760152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,8,balanced,0.2624640067418416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,8,balanced,0.26368000109990436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,8,balanced,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,8,balanced,0.27135999997456867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,8,balanced,0.27426133553187054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,8,balanced,0.27903467416763306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,8,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,8,balanced,0.3012266755104065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,8,balanced,0.31675734122594196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,8,balanced,0.33586664994557697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,8,balanced,0.3887786865234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,8,balanced,0.4198400179545085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,8,balanced,0.49544533093770343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,8,balanced,0.6010773181915283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,8,balanced,0.8654507001241049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,8,balanced,1.1864746411641438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,2,balanced,0.042490666111310325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,2,balanced,0.24369599421819052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,2,balanced,0.46114134788513184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,2,balanced,0.4614826838175456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,2,balanced,0.4614826838175456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,2,balanced,0.46436798572540283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,2,balanced,0.4664320151011149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,2,balanced,0.46916266282399494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,2,balanced,0.4724053144454956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,2,balanced,0.4747946659723918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,2,balanced,0.47889065742492676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,2,balanced,0.4814506769180298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,2,balanced,0.48468267917633057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,2,balanced,0.4910080035527547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,2,balanced,0.5048319896062216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,2,balanced,0.5111466646194458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,2,balanced,0.5300906499226888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,2,balanced,0.5978453159332275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,2,balanced,0.6586026748021444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,2,balanced,0.8506027062733968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,2,balanced,0.9934506416320801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,2,balanced,1.550506591796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,2,balanced,2.016767978668213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,2,balanced,3.0327466328938804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,2,balanced,4.029610633850098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,2,balanced,6.025386810302734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,2,balanced,7.845717112223308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,16,power_law_1.01,0.04136320054531097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,16,power_law_1.01,0.19107840061187745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,16,power_law_1.01,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,16,power_law_1.01,0.1632256031036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,16,power_law_1.01,0.1763327956199646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,16,power_law_1.01,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,16,power_law_1.01,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,16,power_law_1.01,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,16,power_law_1.01,0.09646080136299133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,16,power_law_1.01,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,16,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,16,power_law_1.01,0.08335360288619995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,16,power_law_1.01,0.1300480008125305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,16,power_law_1.01,0.13434879779815673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,16,power_law_1.01,0.14049279689788818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,16,power_law_1.01,0.16609280109405516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,16,power_law_1.01,0.18513920307159423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,16,power_law_1.01,0.20193281173706054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,16,power_law_1.01,0.18471039533615113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,16,power_law_1.01,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,16,power_law_1.01,0.2559999942779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,16,power_law_1.01,0.3180543899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,16,power_law_1.01,0.367411208152771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,16,power_law_1.01,0.5111807823181153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,16,power_law_1.01,0.6891520023345947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,16,power_law_1.01,1.0522496223449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,16,power_law_1.01,1.419264030456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,32,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,32,balanced,0.03958933303753535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,32,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,32,balanced,0.04026666780312856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,32,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,32,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,32,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,32,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,32,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,32,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,32,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,32,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,32,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,32,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,32,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,32,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,32,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,32,balanced,0.06843733290831248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,32,balanced,0.08550399541854858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,32,balanced,0.12663466731707254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,32,balanced,0.26077866554260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,32,balanced,0.3232426643371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,32,balanced,0.4870826800664266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,32,balanced,0.6580906709035238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,32,balanced,1.0067626635233562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,32,balanced,1.3300053278605144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,32,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,32,power_law_1.2,0.02375040054321289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,32,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,32,power_law_1.2,0.02353920042514801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,32,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,32,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,32,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,32,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,32,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,32,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,32,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,32,power_law_1.2,0.027014398574829103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,32,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,32,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,32,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,32,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,32,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,32,power_law_1.2,0.05754240155220032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,32,power_law_1.2,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,32,power_law_1.2,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,32,power_law_1.2,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,32,power_law_1.2,0.14725120067596437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,32,power_law_1.2,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,32,power_law_1.2,0.36618239879608155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,32,power_law_1.2,0.48496642112731936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,32,power_law_1.2,0.7012351989746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,32,power_law_1.2,1.010688018798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,16,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,16,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,16,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,16,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,16,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,16,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,16,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,16,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,16,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,16,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,16,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,16,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,16,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,1,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,16,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,1,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,16,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,1,power_law_1.01,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,1,power_law_1.01,0.1691648006439209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,16,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,1,power_law_1.01,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,16,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,1,power_law_1.01,0.3827584028244019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,16,power_law_1.01,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,1,power_law_1.01,0.397708797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,1,power_law_1.01,0.4255680084228516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,16,power_law_1.01,0.18698240518569947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,1,power_law_1.01,0.42455039024353025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,16,power_law_1.01,0.25763840675354005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,1,power_law_1.01,0.43702402114868166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,1,power_law_1.01,0.4483071804046631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,16,power_law_1.01,0.31784958839416505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,1,power_law_1.01,0.46284799575805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,16,power_law_1.01,0.4335616111755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,1,power_law_1.01,0.46448640823364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,1,power_law_1.01,0.4853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,16,power_law_1.01,0.5640192031860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,1,power_law_1.01,0.48824319839477537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,1,power_law_1.01,0.5074944019317627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,16,power_law_1.01,0.8501248359680176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,1,power_law_1.01,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,1,power_law_1.01,0.5789696216583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,16,power_law_1.01,1.16428804397583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,1,power_law_1.01,0.6242303848266602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,1,power_law_1.01,0.7352320194244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,1,power_law_1.01,0.8699904441833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,16,power_law_1.01,1.845452880859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,1,power_law_1.01,1.1337727546691894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,1,power_law_1.01,1.325055980682373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,16,power_law_1.01,2.674892807006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,1,power_law_1.01,1.8491392135620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,1,power_law_1.01,2.3531520843505858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,1,power_law_1.01,3.370393753051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,1,power_law_1.01,4.334592056274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,1,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,1,power_law_1.2,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,1,power_law_1.2,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,1,power_law_1.2,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,1,power_law_1.2,0.4253695964813232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,1,power_law_1.2,0.7495552062988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,1,power_law_1.2,0.7968768119812012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,1,power_law_1.2,0.8072896003723145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,1,power_law_1.2,0.8355839729309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,1,power_law_1.2,0.8558591842651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,1,power_law_1.2,0.8699904441833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,1,power_law_1.2,0.9078783988952637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,1,power_law_1.2,0.9154560089111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,1,power_law_1.2,0.9412351608276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,1,power_law_1.2,0.9773056030273437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,1,power_law_1.2,1.0063872337341309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,1,power_law_1.2,1.0579968452453614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,1,power_law_1.2,1.1745280265808105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,1,power_law_1.2,1.2795904159545899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,1,power_law_1.2,1.5060992240905762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,1,power_law_1.2,1.7496063232421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,1,power_law_1.2,2.208563232421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,1,power_law_1.2,2.576588821411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,1,power_law_1.2,3.4951103210449217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,8,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,8,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,8,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,8,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,8,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,8,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,8,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,8,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,8,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,8,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,8,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,8,balanced,0.04112533231576284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,8,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,8,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,8,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,8,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,8,balanced,0.08618666728337605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,8,balanced,0.10376532872517903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,8,balanced,0.2512213389078776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,8,balanced,0.3295573393503825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,8,balanced,0.49851731459299725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,8,balanced,0.6840319633483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,8,balanced,1.0536959966023762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,8,balanced,1.4472533861796062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,1,power_law_1.2,4.398662567138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,64,power_law_1.2,0.027641600370407103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,64,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,64,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,64,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,64,power_law_1.2,0.0286655992269516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,64,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,64,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,64,power_law_1.2,0.02988159954547882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,64,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,64,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,64,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,64,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,64,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,64,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,64,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,64,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,64,power_law_1.2,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,64,power_law_1.2,0.12963839769363403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,64,power_law_1.2,0.1581055998802185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,64,power_law_1.2,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,4,power_law_1.2,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,4,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,4,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,4,power_law_1.2,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,1,power_law_1.2,6.386687850952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,4,power_law_1.2,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,64,power_law_1.2,0.4016128063201904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,4,power_law_1.2,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,4,power_law_1.2,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,4,power_law_1.2,0.2549760103225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,4,power_law_1.2,0.25128960609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,4,power_law_1.2,0.23736319541931153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,4,power_law_1.2,0.26521599292755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,4,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,4,power_law_1.2,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,4,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,4,power_law_1.2,0.2934655904769897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,4,power_law_1.2,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,4,power_law_1.2,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,4,power_law_1.2,0.3704832077026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,4,power_law_1.2,0.40468478202819824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,4,power_law_1.2,0.5625855922698975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,4,power_law_1.2,0.7477248191833497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,4,power_law_1.2,1.1356160163879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,4,power_law_1.2,1.5116288185119628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,4,power_law_1.2,2.2648832321166994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,4,power_law_1.2,2.9519872665405273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,4,power_law_1.2,4.697702407836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,4,power_law_1.2,5.563801574707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,64,power_law_1.2,0.6250495910644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,64,power_law_1.2,0.8769536018371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,1,power_law_1.2,8.36669464111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,64,power_law_1.2,1.4858240127563476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,2,power_law_1.2,1.1413503646850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,2,power_law_1.2,1.6556032180786133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,2,power_law_1.2,2.853683280944824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,2,power_law_1.2,3.870105743408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,2,power_law_1.2,5.086822509765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,2,power_law_1.2,8.28067855834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,2,power_law_1.2,8.831795501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,2,power_law_1.2,9.263104248046876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,2,power_law_1.2,9.822796630859376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,2,power_law_1.2,9.566822052001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,2,power_law_1.2,10.200064086914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,2,power_law_1.2,10.497433471679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,2,power_law_1.2,10.249420928955079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,2,power_law_1.2,11.103231811523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,2,power_law_1.2,11.379507446289063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,2,power_law_1.2,11.272806549072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,2,power_law_1.2,11.57754898071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,64,power_law_1.2,1.9116031646728515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,2,power_law_1.2,12.358246612548829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,2,power_law_1.2,12.898098754882813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,1,power_law_1.2,0.20131840705871581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,1,power_law_1.2,0.36024320125579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,2,power_law_1.2,13.655616760253906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,1,power_law_1.2,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,1,power_law_1.2,1.1978752136230468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,1,power_law_1.2,1.7539072036743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,1,power_law_1.2,2.392268753051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,1,power_law_1.2,3.7130176544189455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,2,power_law_1.2,16.590425109863283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,1,power_law_1.2,3.778969573974609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,1,power_law_1.2,4.043161773681641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,1,power_law_1.2,4.0015617370605465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,1,power_law_1.2,4.109926223754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,2,power_law_1.2,20.180172729492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,1,power_law_1.2,4.434329605102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,1,power_law_1.2,4.464640045166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,1,power_law_1.2,4.7355903625488285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,1,power_law_1.2,4.764057540893555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,2,power_law_1.2,19.89710693359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,1,power_law_1.2,4.871987152099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,1,power_law_1.2,5.0745281219482425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,1,power_law_1.2,5.320908737182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,1,power_law_1.2,5.5523326873779295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,2,power_law_1.2,23.59477081298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,1,power_law_1.2,5.699993515014649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,1,power_law_1.2,6.046105575561524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,1,power_law_1.2,6.824550628662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,1,power_law_1.2,7.564288330078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,1,power_law_1.2,9.254502105712891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,2,power_law_1.2,28.476007080078126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,1,power_law_1.2,11.094617462158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,2,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,2,power_law_1.2,0.235315203666687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,2,power_law_1.2,0.3907583951950073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,2,power_law_1.2,0.49889278411865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,2,power_law_1.2,0.6444992065429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,2,power_law_1.2,1.0395648002624511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,2,power_law_1.2,1.1651071548461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,2,power_law_1.2,1.220588779449463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,1,power_law_1.2,14.797415161132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,2,power_law_1.2,1.2392448425292968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,2,power_law_1.2,1.265664005279541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,2,power_law_1.2,1.3195263862609863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,2,power_law_1.2,1.3752320289611817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,2,power_law_1.2,1.367859172821045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,2,power_law_1.2,1.4014464378356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,2,power_law_1.2,1.4792703628540038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,2,power_law_1.2,1.4782464027404785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,1,power_law_1.2,17.288787841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,2,power_law_1.2,1.5052800178527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,2,power_law_1.2,1.6684991836547851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,2,power_law_1.2,1.7801216125488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,2,power_law_1.2,1.944166374206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,2,power_law_1.2,2.1903360366821287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,2,power_law_1.2,38.677703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,2,power_law_1.2,2.6820608139038087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,2,power_law_1.2,3.3710079193115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,2,power_law_1.2,4.49536018371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,2,power_law_1.2,5.126144027709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,2,power_law_1.2,7.678975677490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,2,power_law_1.2,46.46051940917969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,2,power_law_1.2,9.882828521728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,2,power_law_1.01,0.7749631881713868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,2,power_law_1.01,0.734003210067749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,2,power_law_1.01,1.277337646484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,2,power_law_1.01,1.702707290649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,2,power_law_1.01,1.7774591445922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,2,power_law_1.01,1.7922048568725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,2,power_law_1.01,1.8585599899291991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,2,power_law_1.01,2.226380729675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,2,power_law_1.01,2.401894378662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,2,power_law_1.01,2.326323127746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,2,power_law_1.01,2.203647994995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,2,power_law_1.01,2.4809471130371095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,2,power_law_1.01,2.7463680267333985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,2,power_law_1.01,3.160268783569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,2,power_law_1.01,3.3284095764160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,2,power_law_1.01,3.4525184631347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,1,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,1,power_law_1.2,0.02741760015487671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,2,power_law_1.01,4.303462219238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,1,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,1,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,1,power_law_1.2,0.062015998363494876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,1,power_law_1.2,0.20807039737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,1,power_law_1.2,0.21890559196472167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,2,power_law_1.01,5.06798095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,1,power_law_1.2,0.23036799430847169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,1,power_law_1.2,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,1,power_law_1.2,0.237772798538208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,1,power_law_1.2,0.24060800075531005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,1,power_law_1.2,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,1,power_law_1.2,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,1,power_law_1.2,0.28180480003356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,1,power_law_1.2,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,1,power_law_1.2,0.2791424036026001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,1,power_law_1.2,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,1,power_law_1.2,0.3436543941497803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,2,power_law_1.01,6.505267333984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,1,power_law_1.2,0.3614720106124878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,1,power_law_1.2,0.4345856189727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,1,power_law_1.2,0.5181439876556396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,1,power_law_1.2,0.7458816051483155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,2,power_law_1.01,8.092057800292968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,1,power_law_1.2,1.0059776306152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,1,power_law_1.2,1.4784511566162108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,4,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,4,balanced,0.0692853331565857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,4,balanced,0.2795520027478536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,4,balanced,0.5423786640167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,2,power_law_1.01,8.955897521972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,4,balanced,1.0369706948598225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,4,balanced,2.026149272918701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,4,balanced,2.0334933598836265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,4,balanced,2.035029411315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,4,balanced,2.042367935180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,4,balanced,2.0478293100992837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,4,balanced,2.0522665977478027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,4,balanced,2.066090742746989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,4,balanced,2.073088010152181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,4,balanced,2.0889600118001304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,4,balanced,2.1118292808532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,4,balanced,2.125823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,4,balanced,2.1642239888509116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,4,balanced,2.272768020629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,4,balanced,2.3393279711405435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,4,balanced,2.4586240450541177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,4,balanced,2.694997469584147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,4,balanced,2.9298346837361655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,4,balanced,3.0911146799723306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,4,balanced,3.7119998931884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,4,balanced,4.314794540405273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,2,power_law_1.01,11.29349136352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,4,balanced,5.699583689371745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,4,balanced,7.110144297281901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,2,power_law_1.01,13.123788452148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,2,power_law_1.01,17.674649047851563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,1,power_law_1.2,1.9216384887695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,4,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,4,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,4,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,4,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,4,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,4,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,4,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,4,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,4,power_law_1.2,0.027635198831558228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,4,power_law_1.2,0.02824319899082184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,4,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,4,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,4,power_law_1.2,0.030502399802207945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,4,power_law_1.2,0.034380799531936644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,4,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,4,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,4,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,4,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,2,power_law_1.01,22.33507843017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,4,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,4,power_law_1.2,0.10199040174484253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,4,power_law_1.2,0.13312000036239624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,4,power_law_1.2,0.23446400165557862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,2,power_law_1.01,33.10653381347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,4,power_law_1.2,0.34037759304046633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,1,power_law_1.2,2.794905662536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,4,power_law_1.2,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,4,power_law_1.2,0.7329792022705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,2,power_law_1.01,31.72392883300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,1,power_law_1.2,3.710540771484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,4,power_law_1.2,1.2748800277709962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,1,balanced,1.0038613478342693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,1,balanced,1.7759572664896648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,1,balanced,3.5022506713867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,1,balanced,3.51197878519694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,1,balanced,3.5290454228719077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,1,balanced,3.533994674682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,1,balanced,3.525631904602051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,1,balanced,3.5485013326009116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,1,balanced,3.6672852834065757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,1,balanced,3.6780373255411782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,1,balanced,3.7229226430257163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,1,balanced,3.7503840128580728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,1,balanced,3.775146802266439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,1,balanced,3.815765380859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,1,balanced,5.720405578613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,1,balanced,5.818880081176758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,1,balanced,5.897216161092122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,1,balanced,8.012629191080729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,1,balanced,9.076730728149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,8,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,8,balanced,0.036330667634805046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,8,balanced,0.03666666646798452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,8,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,8,balanced,0.040949332217375435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,1,balanced,10.250069300333658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,8,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,8,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,8,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,8,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,8,balanced,0.04674666623274485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,8,balanced,0.04828799764315287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,8,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,8,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,8,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,8,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,8,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,8,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,8,balanced,0.07217066486676534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,8,balanced,0.0960586667060852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,8,balanced,0.15495466192563376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,8,balanced,0.24320000410079956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,8,balanced,0.30395734310150146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,8,balanced,0.4179626703262329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,8,balanced,0.5452800194422404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,1,balanced,12.428799947102865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,8,balanced,0.8811306953430176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,8,balanced,1.2856319745381672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,1,balanced,15.296512603759766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,1,balanced,18.68595250447591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,1,balanced,24.42376454671224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,4,power_law_1.2,1.6013311386108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,1,balanced,29.525670369466145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,1,balanced,40.922281901041664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,1,balanced,51.93403625488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,8,power_law_1.2,0.46776318550109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,8,power_law_1.2,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,8,power_law_1.2,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,8,power_law_1.2,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,8,power_law_1.2,0.4718592166900635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,8,power_law_1.2,0.48107519149780276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,8,power_law_1.2,0.6438911914825439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,8,power_law_1.2,0.7530496120452881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,8,power_law_1.2,0.873472023010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,8,power_law_1.2,0.9361408233642579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,8,power_law_1.2,0.8071167945861817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,8,power_law_1.2,0.9805824279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,8,power_law_1.2,1.1573247909545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,8,power_law_1.2,1.4082048416137696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,8,power_law_1.2,1.6324607849121093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,8,power_law_1.2,2.009292793273926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,8,power_law_1.2,2.377728080749512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,8,power_law_1.2,3.319193649291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,8,power_law_1.2,4.270489501953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,8,power_law_1.2,5.419827270507812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,8,power_law_1.2,6.246809768676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,8,power_law_1.2,8.135475158691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,8,power_law_1.2,9.314713287353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,8,power_law_1.2,12.53191680908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,8,power_law_1.2,16.100755310058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,64,power_law_1.01,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,64,power_law_1.01,0.22609920501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,64,power_law_1.01,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,64,power_law_1.01,0.2258944034576416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,64,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,64,power_law_1.01,0.1171455979347229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,64,power_law_1.01,0.16302080154418946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,64,power_law_1.01,0.19456000328063966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,64,power_law_1.01,0.20992000102996827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,64,power_law_1.01,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,64,power_law_1.01,0.2224128007888794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,64,power_law_1.01,0.22036480903625488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,64,power_law_1.01,0.22282240390777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,64,power_law_1.01,0.24432640075683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,64,power_law_1.01,0.19967360496520997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,64,power_law_1.01,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,64,power_law_1.01,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,64,power_law_1.01,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,64,power_law_1.01,0.33320319652557373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,64,power_law_1.01,0.3758080005645752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,64,power_law_1.01,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,64,power_law_1.01,0.47656960487365724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,64,power_law_1.01,0.6334464073181152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,64,power_law_1.01,0.9263104438781739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,64,power_law_1.01,1.173299217224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,64,power_law_1.01,1.8872255325317382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,64,power_law_1.01,2.52805118560791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,32,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,32,balanced,0.02372266600529353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,32,balanced,0.02387733260790507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,32,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,32,balanced,0.025413334369659424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,32,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,32,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,32,balanced,0.026608000199000042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,32,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,32,balanced,0.026613332331180573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,32,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,32,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,32,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,32,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,32,balanced,0.0310506671667099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,32,balanced,0.031888000667095184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,32,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,32,balanced,0.03649600098530451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,32,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,32,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,32,balanced,0.07098666826883952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,32,balanced,0.07321600119272868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,32,balanced,0.19950934251149496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,32,balanced,0.26436267296473187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,32,balanced,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,32,balanced,0.5405013163884481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,8,power_law_1.2,20.04111328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,1,power_law_1.2,1.7663936614990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,1,power_law_1.2,2.8289024353027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,1,power_law_1.2,3.5104766845703126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,1,power_law_1.2,6.609919738769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,1,power_law_1.2,6.803250885009765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,1,power_law_1.2,7.001292419433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,1,power_law_1.2,7.615487670898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,1,power_law_1.2,7.978150177001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,1,power_law_1.2,8.588082885742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,1,power_law_1.2,8.939315032958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,1,power_law_1.2,8.13342742919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,1,power_law_1.2,8.910848236083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,1,power_law_1.2,9.384960174560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,1,power_law_1.2,10.402816009521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,1,power_law_1.2,11.813887786865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,1,power_law_1.2,12.986778259277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,1,power_law_1.2,14.859878540039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,1,power_law_1.2,19.988890075683592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,16,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,16,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,16,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,16,balanced,0.2802346746126811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,16,balanced,0.5384533405303955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,16,balanced,1.0390186309814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,16,balanced,1.0426026980082195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,16,balanced,1.0466986497243245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,16,balanced,1.0482186476389568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,16,balanced,1.047381321589152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,1,power_law_1.2,23.621221923828124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,16,balanced,1.052671988805135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,16,balanced,1.0579626560211182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,16,balanced,1.0588160355885823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,16,balanced,1.067519982655843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,16,balanced,1.074005365371704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,16,balanced,1.0781013170878093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,16,balanced,1.0938026905059814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,16,balanced,1.1345919768015544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,16,balanced,1.1586559613545735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,16,balanced,1.2016639709472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,16,balanced,1.2506453196207683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,16,balanced,1.3991252581278484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,16,balanced,1.4735360145568848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,16,balanced,1.6692907015482585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,16,balanced,2.0208640098571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,16,balanced,2.5815040270487466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,16,balanced,3.09879461924235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,1,power_law_1.2,29.408657836914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,1,power_law_1.2,32.30781555175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,8,power_law_1.2,27.481906127929687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,1,power_law_1.2,40.51968078613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,1,power_law_1.2,45.65278625488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,1,power_law_1.2,60.5497314453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,8,power_law_1.01,0.316211199760437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,8,power_law_1.01,0.5513216018676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,8,power_law_1.01,1.0588159561157227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,8,power_law_1.01,0.9226240158081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,8,power_law_1.01,1.0819583892822267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,8,power_law_1.01,1.371340847015381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,8,power_law_1.01,1.2005375862121581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,8,power_law_1.01,1.3451135635375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,8,power_law_1.01,1.3764608383178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,8,power_law_1.01,1.1692031860351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,8,power_law_1.01,1.4141440391540527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.08191999793052673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,8,power_law_1.01,1.347379207611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.22220799922943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.3268608093261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.48762879371643064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,8,power_law_1.01,1.367039966583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.4779967784881592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.5326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.5367807865142822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,8,power_law_1.01,1.2996607780456544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.5421055793762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,8,power_law_1.01,1.4016511917114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.5476352214813233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.5511168003082275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,8,power_law_1.01,1.3953023910522462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.5631807804107666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.5855231761932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,8,power_law_1.01,1.429088020324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.5679103851318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,8,power_law_1.01,1.542745590209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.610918378829956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,8,power_law_1.01,1.657222366333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.6305791854858398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.7063551902770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,8,power_law_1.01,1.7387519836425782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,8,power_law_1.01,1.8571264266967773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.7798399925231934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,8,power_law_1.01,2.127859115600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,8,power_law_1.01,2.4008703231811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.830668830871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,8,power_law_1.01,3.2905086517333983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,8,power_law_1.01,3.6704254150390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,1,power_law_1.01,1.0999808311462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,8,power_law_1.01,5.070028686523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,8,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,8,power_law_1.01,5.801984024047852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,1,power_law_1.01,1.3299712181091308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,8,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,8,power_law_1.2,0.22977280616760254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,8,power_law_1.2,0.2248447895050049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,8,power_law_1.2,0.32378880977630614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,8,power_law_1.2,0.3905535936355591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,8,power_law_1.2,0.37601280212402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,8,power_law_1.2,0.323142409324646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,8,power_law_1.2,0.30453760623931886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,8,power_law_1.2,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,1,power_law_1.01,1.8431999206542968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,8,power_law_1.2,0.35389440059661864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,8,power_law_1.2,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,8,power_law_1.2,0.3907455921173096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,8,power_law_1.2,0.3948415994644165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,8,power_law_1.2,0.39137279987335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,1,power_law_1.01,2.345574378967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,8,power_law_1.2,0.4009984016418457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,8,power_law_1.2,0.4302847862243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,8,power_law_1.2,0.46837759017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,8,power_law_1.2,0.5236608028411865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,8,power_law_1.2,0.596992015838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,8,power_law_1.2,0.6957056045532226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,8,power_law_1.2,0.9144319534301758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,8,power_law_1.2,1.127014446258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,8,power_law_1.2,1.5820799827575684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,8,power_law_1.2,2.1116928100585937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,8,power_law_1.2,3.053363227844238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,8,power_law_1.2,4.168294525146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,1,power_law_1.01,3.423436737060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,1,power_law_1.2,71.12396850585938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,1,power_law_1.01,4.468294525146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,1,power_law_1.01,6.217113494873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,1,power_law_1.2,96.39751586914062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,1,power_law_1.01,8.056626892089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,1,power_law_1.2,119.55076904296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,4,power_law_1.01,1.096288013458252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,4,power_law_1.01,2.072153663635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,4,power_law_1.01,2.551193618774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,4,power_law_1.01,3.8367233276367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,4,power_law_1.01,4.499660873413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,4,power_law_1.01,4.837785720825195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,4,power_law_1.01,6.293503952026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,4,power_law_1.01,6.056345748901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,4,power_law_1.01,6.458367919921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,4,power_law_1.01,6.760447692871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,4,power_law_1.01,6.9263359069824215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,4,power_law_1.01,7.088947296142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,4,power_law_1.01,6.944358062744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,4,power_law_1.01,7.061504364013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,4,power_law_1.01,7.382425689697266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,4,power_law_1.01,7.337165069580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,4,power_law_1.01,8.323468780517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,4,power_law_1.01,8.58787841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,4,power_law_1.01,8.523961639404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,2,power_law_1.01,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,2,power_law_1.01,0.6768640041351318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,2,power_law_1.01,1.0024959564208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,4,power_law_1.01,9.027993774414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,2,power_law_1.01,1.6168960571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,2,power_law_1.01,2.347417640686035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,2,power_law_1.01,3.040665626525879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,4,power_law_1.01,9.698099517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,2,power_law_1.01,3.9776256561279295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,2,power_law_1.01,3.9006206512451174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,4,power_law_1.01,10.48616943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,2,power_law_1.01,4.180172729492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,2,power_law_1.01,4.274380874633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,4,power_law_1.01,11.494790649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,2,power_law_1.01,4.315750503540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,2,power_law_1.01,4.438016128540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,2,power_law_1.01,4.5070335388183596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,4,power_law_1.01,14.306918334960937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,2,power_law_1.01,4.777779388427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,2,power_law_1.01,4.694220733642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,2,power_law_1.01,4.755456161499024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,4,power_law_1.01,15.920127868652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,2,power_law_1.01,4.78924789428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,2,power_law_1.01,4.909260940551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,2,power_law_1.01,5.057740783691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,2,power_law_1.01,5.449523162841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,4,power_law_1.01,21.304115295410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,2,power_law_1.01,5.627494430541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,2,power_law_1.01,6.574694061279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,2,power_law_1.01,6.967705535888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,4,power_law_1.01,26.013900756835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,2,power_law_1.01,8.286617279052734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,2,power_law_1.01,9.465856170654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,2,power_law_1.01,12.108595275878907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,2,power_law_1.01,15.60248260498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,16,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,16,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,16,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,16,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,16,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,16,power_law_1.2,0.04709759950637817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,16,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,16,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,16,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,16,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,16,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,16,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,16,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,16,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,16,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,16,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,16,power_law_1.2,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,16,power_law_1.2,0.12083200216293336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,16,power_law_1.2,0.1906496047973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,16,power_law_1.2,0.2541568040847778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,16,power_law_1.2,0.3416064023971558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,16,power_law_1.2,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,16,power_law_1.2,0.591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,16,power_law_1.2,0.9646080017089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,16,power_law_1.2,1.3559807777404784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,16,power_law_1.2,2.168012809753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,16,power_law_1.2,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,16,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,16,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,16,power_law_1.2,3.1653888702392576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,16,power_law_1.2,0.029267200827598573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,16,power_law_1.2,0.02884480059146881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,16,power_law_1.2,0.029862400889396668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,16,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,16,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,16,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,16,power_law_1.2,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,16,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,16,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,16,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,16,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,16,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,16,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,16,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,16,power_law_1.2,0.05118719935417175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,16,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,16,power_law_1.2,0.09379199743270875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,16,power_law_1.2,0.10711040496826171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,16,power_law_1.2,0.16650240421295165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,16,power_law_1.2,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,16,power_law_1.2,0.3719167947769165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,16,power_law_1.2,0.5099520206451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,16,power_law_1.2,0.8529919624328614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,16,power_law_1.2,1.2380160331726073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,4,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,4,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,4,balanced,0.17698132991790771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,4,balanced,0.3541333278020223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,4,balanced,0.672426700592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,4,balanced,1.3013333479563396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,4,balanced,1.3064533074696858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,4,balanced,1.3100266456604004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,4,balanced,1.3142986297607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,4,balanced,1.317034641901652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,4,balanced,1.3228373527526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,4,balanced,1.3306879997253418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,4,balanced,1.3370025952657063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,4,balanced,1.3477439880371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,4,balanced,1.3591893513997395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,4,balanced,1.3685760498046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,4,balanced,1.3887146313985188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,4,balanced,1.4252373377482097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,4,balanced,1.4634666442871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,4,balanced,1.5482880274454753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,4,balanced,1.6324267387390137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,4,balanced,1.7256107330322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,4,balanced,1.8614613215128581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,4,balanced,2.1167786916097007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,4,balanced,2.453674634297689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,4,balanced,3.120981216430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,4,balanced,3.9563945134480796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,4,balanced,0.3447466691335042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,4,balanced,0.5869226853052775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,4,balanced,1.129642645517985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,4,balanced,2.2277119954427085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,4,balanced,4.42299747467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,4,balanced,5.49836794535319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,4,balanced,5.523626963297526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,4,balanced,5.390677134195964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,4,balanced,5.401429494222005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,4,balanced,5.409791946411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,4,balanced,5.427370707194011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,4,balanced,5.442560195922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,4,balanced,5.461162567138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,4,balanced,5.486421585083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,4,balanced,5.534208297729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,4,balanced,5.729109446207683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,4,balanced,5.780650456746419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,4,balanced,5.917184193929036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,4,balanced,5.99620246887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,4,balanced,6.935722351074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,128,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,128,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,128,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,128,balanced,0.023200000325838726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,128,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,128,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,128,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,128,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,128,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,4,balanced,7.261861165364583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,128,balanced,0.02474133421977361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,4,balanced,7.660885492960612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,128,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,128,balanced,0.025936000049114227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,128,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,128,balanced,0.026613332331180573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,128,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,128,balanced,0.028666667640209198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,128,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,128,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,128,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,128,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,128,balanced,0.03734400123357773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,128,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,128,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,128,balanced,0.06348800162474315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,128,balanced,0.1088853379090627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,4,balanced,7.650645573933919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,128,balanced,0.26026666164398193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,128,balanced,0.35601067543029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,4,balanced,9.415850957234701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,4,balanced,10.63321622212728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,4,balanced,13.894143422444662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,4,balanced,17.778004964192707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,2,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,2,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,2,balanced,0.2754559914271037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,2,balanced,0.2752853234608968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,2,balanced,0.27801599105199176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,2,balanced,0.28040534257888794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,2,balanced,0.28226133187611896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,2,balanced,0.28945066531499225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,2,balanced,0.28737600644429523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,2,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,2,balanced,0.29180800914764404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,2,balanced,0.28962133328119916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,2,balanced,0.291157325108846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,2,balanced,0.2984960079193115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,2,balanced,0.306005338827769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,2,balanced,0.3222133318583171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,2,balanced,0.3179519971211751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,2,balanced,0.3653973340988159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,2,balanced,0.3805866638819377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,2,balanced,0.4604586760203044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,2,balanced,0.5507413148880005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,2,balanced,0.8118613560994467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,2,balanced,1.0929493109385173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,2,balanced,1.6358399391174316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,2,balanced,2.2210559844970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,2,balanced,3.260234514872233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,2,balanced,4.406271934509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,128,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,128,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,128,power_law_1.2,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,128,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,128,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,128,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,128,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,128,power_law_1.2,0.03704319894313812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,128,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,128,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,128,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,128,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,128,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,128,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,128,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,128,power_law_1.2,0.046265599131584165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,128,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,128,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,128,power_law_1.2,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,128,power_law_1.2,0.09992319941520691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,128,power_law_1.2,0.12983039617538453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.2910207986831665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,128,power_law_1.2,0.17141760587692262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,128,power_law_1.2,0.26071040630340575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,128,power_law_1.2,0.4395008087158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,128,power_law_1.2,0.5296127796173096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,128,power_law_1.2,0.7813119888305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,1,power_law_1.01,1.0356736183166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,128,power_law_1.2,1.3113280296325684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,1,power_law_1.01,1.8305023193359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,1,power_law_1.01,2.6472448348999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,1,power_law_1.01,3.0656511306762697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,1,power_law_1.01,3.972915267944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,1,power_law_1.01,4.220313644409179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,1,power_law_1.01,4.4130302429199215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,1,power_law_1.01,4.477337646484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,1,power_law_1.01,4.708966445922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,1,power_law_1.01,4.78392333984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,1,power_law_1.01,4.979302215576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,1,power_law_1.01,5.206220626831055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,1,power_law_1.01,5.278924942016602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,1,power_law_1.01,5.638348770141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,1,power_law_1.01,6.057779312133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,1,power_law_1.01,6.337331390380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,1,power_law_1.01,6.901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,1,power_law_1.01,7.5886589050292965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,1,power_law_1.01,8.650956726074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,1,power_law_1.01,9.402777862548827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,4,power_law_1.01,0.21564159393310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,1,power_law_1.01,11.57611541748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,4,power_law_1.01,0.39731199741363527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,4,power_law_1.01,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,4,power_law_1.01,0.5558271884918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,4,power_law_1.01,0.7161856174468995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,4,power_law_1.01,0.9904128074645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,1,power_law_1.01,13.345382690429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,4,power_law_1.01,0.9684991836547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,4,power_law_1.01,0.9854975700378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,4,power_law_1.01,0.9469951629638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,4,power_law_1.01,0.939417552947998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,4,power_law_1.01,0.9326592445373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,4,power_law_1.01,1.0489855766296388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,4,power_law_1.01,1.0491904258728026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,4,power_law_1.01,1.055129623413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,1,power_law_1.01,17.95379180908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,4,power_law_1.01,1.1018239974975585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,4,power_law_1.01,1.1069439888000487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,4,power_law_1.01,1.1587583541870117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,4,power_law_1.01,1.2515328407287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,4,power_law_1.01,1.3639679908752442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,4,power_law_1.01,1.6050176620483398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,4,power_law_1.01,1.9369983673095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,4,power_law_1.01,2.4012800216674806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,1,power_law_1.01,21.569740295410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,4,power_law_1.01,2.679193687438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,4,power_law_1.01,3.7974014282226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,4,power_law_1.01,4.461772918701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,4,power_law_1.01,6.6467842102050785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,4,power_law_1.01,8.694989013671876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,8,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,8,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,8,power_law_1.01,0.2902015924453735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,8,power_law_1.01,0.25804800987243653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,8,power_law_1.01,0.3190783977508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,8,power_law_1.01,0.35942399501800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,8,power_law_1.01,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,8,power_law_1.01,0.36637439727783205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,8,power_law_1.01,0.39935998916625975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,8,power_law_1.01,0.40755200386047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,8,power_law_1.01,0.3794944047927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,8,power_law_1.01,0.3631103992462158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,8,power_law_1.01,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,8,power_law_1.01,0.3901439905166626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,8,power_law_1.01,0.37845120429992674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,8,power_law_1.01,0.42270717620849607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,8,power_law_1.01,0.4306943893432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,8,power_law_1.01,0.4655104160308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,8,power_law_1.01,0.5072896003723144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,8,power_law_1.01,0.591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,8,power_law_1.01,0.669491195678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,8,power_law_1.01,0.8499199867248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,8,power_law_1.01,1.0831744194030761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,8,power_law_1.01,1.4784511566162108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,8,power_law_1.01,1.9009536743164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,8,power_law_1.01,2.860646438598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,8,power_law_1.01,3.684966278076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,1,balanced,0.1544533371925354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,1,balanced,0.34781865278879803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,1,balanced,0.6685012976328532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,1,balanced,1.3054292996724446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,1,balanced,2.5654613176981607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,1,balanced,5.082624117533366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,1,balanced,5.095909436543782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,1,balanced,5.108736038208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,1,balanced,5.119999885559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,1,balanced,5.131264050801595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,1,balanced,5.1532745361328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,1,balanced,5.174442609151204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,1,balanced,5.191509246826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,1,balanced,5.229909261067708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,1,balanced,5.268992106119792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,1,balanced,5.305002530415853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,1,balanced,5.372416178385417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,1,balanced,5.683882395426433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,1,balanced,5.813077290852864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,1,balanced,5.868031819661458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,1,balanced,6.182229359944661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,1,balanced,6.47543462117513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,1,balanced,6.910122553507487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,1,balanced,7.85868771870931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,1,balanced,8.782480239868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,1,balanced,11.41043217976888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,1,balanced,14.125226338704428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,2,balanced,0.05272533496220907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,2,balanced,0.05526400109132131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,2,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,2,balanced,0.08669867118199666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,2,balanced,0.30856533845265705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,2,balanced,0.3877546787261963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,2,balanced,0.3927040100097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,2,balanced,0.39713064829508465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,2,balanced,0.4031146764755249
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,2,balanced,0.40635732809702557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,2,balanced,0.41557331879933673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,2,balanced,0.4251306851704915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,2,balanced,0.43263999621073407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,2,balanced,0.4478293259938558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,2,balanced,0.46506667137145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,2,balanced,0.4797439972559611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,2,balanced,0.505514661471049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,2,balanced,0.5614933172861735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,2,balanced,0.6294186512629191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,2,balanced,0.814250628153483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,2,balanced,1.017514705657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,2,balanced,1.4484373728434246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,2,balanced,1.8643627166748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,8,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,8,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,8,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,8,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,8,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,8,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,2,balanced,2.7514880498250327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,2,balanced,3.6065279642740884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,8,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,8,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,8,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,8,balanced,0.038560000558694206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,8,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,8,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,8,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,8,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,8,balanced,0.05973333120346069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,2,balanced,5.315925280253093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,8,balanced,0.09710933764775594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,8,balanced,0.08755200107892354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,8,balanced,0.15018666783968607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,8,balanced,0.16315733393033346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,8,balanced,0.26316799720128375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,8,balanced,0.4131840070088704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,8,balanced,0.6128640174865723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,8,balanced,0.8499200344085693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,2,balanced,7.036757151285808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,2,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,2,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,2,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,2,power_law_1.2,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,2,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,2,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,2,power_law_1.2,0.07639039754867553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,2,power_law_1.2,0.08622080087661743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,2,power_law_1.2,0.0894976019859314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,2,power_law_1.2,0.09314560294151306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,2,power_law_1.2,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,2,power_law_1.2,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,2,power_law_1.2,0.16343040466308595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,2,power_law_1.2,0.18431999683380126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,2,power_law_1.2,0.18677760362625123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,2,power_law_1.2,0.21954560279846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,2,power_law_1.2,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,2,power_law_1.2,0.2668544054031372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,2,power_law_1.2,0.3037184000015259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,2,power_law_1.2,0.3811327934265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,2,power_law_1.2,0.44810237884521487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,2,power_law_1.2,0.7038976192474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,2,power_law_1.2,0.9447423934936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,2,power_law_1.2,1.427660846710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,2,power_law_1.2,2.048204803466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,2,power_law_1.2,2.991103935241699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,2,power_law_1.2,3.688857650756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,4,power_law_1.2,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,4,power_law_1.2,0.35614719390869143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,4,power_law_1.2,0.4257791996002197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,4,power_law_1.2,0.4958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,4,power_law_1.2,0.7284736156463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,4,power_law_1.2,0.8736767768859863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,4,power_law_1.2,1.1366399765014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,4,power_law_1.2,1.0647551536560058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,4,power_law_1.2,1.1235136032104491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,4,power_law_1.2,1.1462656021118165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,4,power_law_1.2,1.0676223754882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,4,power_law_1.2,1.16428804397583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,4,power_law_1.2,1.1448320388793944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,4,power_law_1.2,1.2543999671936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,4,power_law_1.2,1.2206080436706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,4,power_law_1.2,1.2539775848388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,4,power_law_1.2,1.3049856185913087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,4,power_law_1.2,1.3168448448181151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,4,power_law_1.2,1.4501888275146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,4,power_law_1.2,1.5939264297485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,4,power_law_1.2,1.7254400253295898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,4,power_law_1.2,1.9779584884643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,4,power_law_1.2,2.3154687881469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,4,power_law_1.2,3.2739326477050783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,4,power_law_1.2,3.4607105255126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,4,power_law_1.2,5.006131362915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,4,power_law_1.2,6.014566421508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,1,power_law_1.01,0.10588159561157226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,1,power_law_1.01,0.16957440376281738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,1,power_law_1.01,0.26439039707183837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,1,power_law_1.01,0.4483071804046631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,1,power_law_1.01,0.4640768051147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,1,power_law_1.01,0.4646912097930908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,1,power_law_1.01,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,1,power_law_1.01,0.466534423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,1,power_law_1.01,0.4728831768035889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,1,power_law_1.01,0.48107519149780276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,1,power_law_1.01,0.4882368087768555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,1,power_law_1.01,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,1,power_law_1.01,0.49560961723327634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,1,power_law_1.01,0.49950718879699707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,1,power_law_1.01,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,1,power_law_1.01,0.5353472232818604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,1,power_law_1.01,0.5636096000671387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,1,power_law_1.01,0.662937593460083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,1,power_law_1.01,0.7741439819335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,1,power_law_1.01,0.940236759185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,1,power_law_1.01,1.2056575775146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,1,power_law_1.01,1.7166336059570313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,1,power_law_1.01,2.188902473449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,4,balanced,0.2730666597684224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,4,balanced,0.27153066794077557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,4,balanced,0.5246293147404989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,4,balanced,0.5295626719792684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,4,balanced,0.527018666267395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,4,balanced,0.5312853256861368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,4,balanced,0.5341866811116537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,4,balanced,0.5348693529764811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,4,balanced,0.5427146752675375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,4,balanced,0.5451093514760336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,4,balanced,0.5486933390299479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,4,balanced,0.5565439860026041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,4,balanced,0.5604693492253622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,4,balanced,0.567466656366984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,4,balanced,0.8065706888834635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,4,balanced,0.8417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,4,balanced,0.8289279937744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,4,balanced,1.0600106716156006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,4,balanced,1.1091626485188801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,4,balanced,1.4726826349894206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,4,balanced,1.5726933479309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,4,balanced,2.109951972961426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,4,balanced,2.594816048940023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,4,balanced,3.6601174672444663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,4,balanced,4.663978576660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,4,balanced,6.323370615641276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,4,balanced,7.8540802001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,1,power_law_1.01,3.3058815002441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,4,power_law_1.2,0.6098944187164307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,4,power_law_1.2,0.7839744091033936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,4,power_law_1.2,1.074176025390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,4,power_law_1.2,1.4004223823547364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,4,power_law_1.2,1.6668672561645508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,4,power_law_1.2,2.3541759490966796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,4,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,4,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,4,balanced,0.0718506673971812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,4,balanced,0.2739199995994568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,4,power_law_1.2,2.184185600280762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,4,balanced,0.5280426740646362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,4,balanced,0.777557373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,4,balanced,0.777557373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,4,balanced,0.7843733628590902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,4,power_law_1.2,2.41393928527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,4,balanced,0.7866026560465494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,4,balanced,0.7932586669921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,4,balanced,0.80076797803243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,4,power_law_1.2,2.4614912033081056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,4,balanced,0.8067413171132406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,4,balanced,0.8185173670450846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,4,balanced,0.8376266956329346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,4,balanced,0.8512852986653646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,4,power_law_1.2,2.4680448532104493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,4,balanced,0.8768853346506754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,4,balanced,0.9255253473917643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,4,balanced,0.9990826447804769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,4,power_law_1.2,2.688198471069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,4,balanced,1.108464002609253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,4,balanced,1.2380159695943196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,4,power_law_1.2,2.6269695281982424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,4,balanced,1.517738660176595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,4,balanced,1.8232320149739583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,4,power_law_1.2,2.7105279922485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,4,balanced,2.3951093355814614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,4,power_law_1.2,2.8475391387939455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,4,balanced,2.9458773930867515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,4,power_law_1.2,2.900377655029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,4,balanced,4.090197245279948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,4,power_law_1.2,2.9054975509643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,4,power_law_1.2,2.9734527587890627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,4,balanced,5.287071863810222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,4,power_law_1.2,3.132211112976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,4,power_law_1.2,3.3017856597900392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,4,power_law_1.2,3.6239166259765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,4,power_law_1.2,4.2448577880859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,4,power_law_1.2,5.068185424804687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,4,power_law_1.2,5.643059158325196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,4,power_law_1.2,7.204863739013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,4,power_law_1.2,9.504134368896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,4,power_law_1.2,12.869631958007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,1,power_law_1.01,4.376780700683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,1,power_law_1.01,6.376038360595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,1,balanced,0.43110398451487225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,1,balanced,0.815445343653361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,1,balanced,1.4272853533426921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,1,balanced,2.8025172551472983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,4,power_law_1.2,15.635865783691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,1,balanced,5.454506556193034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,1,balanced,8.03652254740397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,1,balanced,8.075775782267252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,1,balanced,8.111274719238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,1,balanced,8.147285461425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,1,balanced,8.181077321370443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,1,balanced,8.24337069193522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,1,balanced,8.303274790445963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,1,balanced,8.352426528930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,1,balanced,8.475135803222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,1,balanced,8.546304066975912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,1,power_law_1.01,8.507596588134765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,1,balanced,8.634368260701498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,1,balanced,8.805194854736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,1,balanced,9.165141423543295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,1,balanced,9.500672022501627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,1,balanced,10.423295974731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,1,balanced,10.590719858805338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,1,balanced,11.691349029541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,1,balanced,12.81228764851888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,1,balanced,15.195477803548178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,1,balanced,18.21491241455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,1,balanced,25.648297627766926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,1,balanced,32.90521494547526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,16,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,16,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,16,power_law_1.01,0.4157440185546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,16,power_law_1.01,0.3956415891647339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,16,power_law_1.01,0.4055039882659912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,16,power_law_1.01,0.4016128063201904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,16,power_law_1.01,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,16,power_law_1.01,0.34651520252227785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,16,power_law_1.01,0.3844095945358276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,16,power_law_1.01,0.33853440284729003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,16,power_law_1.01,0.35509119033813474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,16,power_law_1.01,0.389516806602478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,16,power_law_1.01,0.37826559543609617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,16,power_law_1.01,0.3782464027404785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,16,power_law_1.01,0.3827712059020996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,16,power_law_1.01,0.404863977432251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,16,power_law_1.01,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,16,power_law_1.01,0.4405248165130615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,16,power_law_1.01,0.502784013748169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,16,power_law_1.01,0.5128191947937012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,16,power_law_1.01,0.5937151908874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,16,power_law_1.01,0.7642943859100342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,16,power_law_1.01,0.9162752151489257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,16,power_law_1.01,1.2130240440368651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,16,power_law_1.01,1.6713727951049804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,16,power_law_1.01,2.2380416870117186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,16,power_law_1.01,2.893414306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,8,power_law_1.2,0.3176448106765747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,8,power_law_1.2,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,8,power_law_1.2,0.7518208026885986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,8,power_law_1.2,0.8284159660339355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,8,power_law_1.2,1.037279987335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,8,power_law_1.2,1.4014464378356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,8,power_law_1.2,1.4337984085083009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,8,power_law_1.2,1.461836814880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,8,power_law_1.2,1.3826047897338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,8,power_law_1.2,1.3813759803771972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,8,power_law_1.2,1.2691455841064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,8,power_law_1.2,1.3273088455200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,8,power_law_1.2,1.2339200019836425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,8,power_law_1.2,1.2822527885437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,8,power_law_1.2,1.319321632385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,8,power_law_1.2,1.3819904327392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,8,power_law_1.2,1.4411775588989257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,8,power_law_1.2,1.4979071617126465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,8,power_law_1.2,1.6279552459716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,8,power_law_1.2,1.801215934753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,8,power_law_1.2,1.8954240798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,4,balanced,0.0452159990866979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,4,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,8,power_law_1.2,2.2384639739990235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,8,power_law_1.2,2.6879999160766603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,4,balanced,0.2841599980990092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,4,balanced,0.5353813171386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,4,balanced,1.0373120307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,4,balanced,1.0419200261433919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,8,power_law_1.2,3.477094268798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,4,balanced,1.0333866278330486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,4,balanced,1.0390133062998455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,4,balanced,1.0410559972127278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,4,balanced,1.0490826765696208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,4,balanced,1.0576213200887044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,8,power_law_1.2,4.148223876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,4,balanced,1.0666666825612385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,4,balanced,1.0801493326822917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,4,balanced,1.0973866780598958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,4,balanced,1.1110400358835857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,4,balanced,1.1359573205312092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,4,balanced,1.1883520285288494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,4,balanced,1.2416000366210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,8,power_law_1.2,5.731123352050782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,4,balanced,1.3378559748331706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,4,balanced,1.4523733456929524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,4,balanced,1.6621227264404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,8,power_law_1.2,6.820658874511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,4,balanced,1.9177813529968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,4,balanced,2.433706601460775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,4,balanced,2.977450688680013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,4,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,4,power_law_1.01,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,4,balanced,4.121088027954102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,4,power_law_1.01,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,4,power_law_1.01,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,4,power_law_1.01,0.2799616098403931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,4,power_law_1.01,0.4296703815460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,4,balanced,5.335381189982097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,4,power_law_1.01,0.38010880947113035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,4,power_law_1.01,0.4190207958221436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,4,power_law_1.01,0.4167679786682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,4,power_law_1.01,0.4229119777679443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,4,power_law_1.01,0.4429823875427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,4,power_law_1.01,0.4607999801635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,4,power_law_1.01,0.4593664169311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,4,power_law_1.01,0.45055999755859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,4,power_law_1.01,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,4,power_law_1.01,0.4454400062561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,4,power_law_1.01,0.4759552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,4,power_law_1.01,0.48761601448059083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,4,power_law_1.01,0.5277696132659913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,4,power_law_1.01,0.5814271926879883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,4,power_law_1.01,0.7194623947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,4,power_law_1.01,0.911564826965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,4,power_law_1.01,0.9342975616455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,4,power_law_1.01,1.2883968353271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,4,power_law_1.01,1.7856512069702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,4,power_law_1.01,2.4424448013305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,4,power_law_1.01,3.2841728210449217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,16,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,16,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,16,balanced,0.030202666918436687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,16,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,16,balanced,0.1909760038057963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,16,balanced,0.2539520064989726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,16,balanced,0.25497599442799884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,16,balanced,0.2542933424313863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,16,balanced,0.25497599442799884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,16,balanced,0.2556533416112264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,16,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,16,balanced,0.25890133778254193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,16,balanced,0.2590720057487488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,16,balanced,0.2610879937807719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,16,balanced,0.26470400889714557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,16,balanced,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,16,balanced,0.2696533401807149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,16,balanced,0.2718399961789449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,16,balanced,0.2872320016225179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,16,balanced,0.2964479923248291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,16,balanced,0.3092479904492696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,16,balanced,0.33740798632303876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,16,balanced,0.3536213239034017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,16,balanced,0.40004265308380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,16,balanced,0.4538026650746663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,16,balanced,0.6485333442687988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,16,balanced,0.8280746936798096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,64,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,64,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,64,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,64,balanced,0.2583893338839213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,64,balanced,0.2991786599159241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,64,balanced,0.30054400364557904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,64,balanced,0.32409600416819256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,64,balanced,0.303274671236674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,64,balanced,0.3041279911994934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,64,balanced,0.30481066306432086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,64,balanced,0.3068586587905884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,64,balanced,0.31010133028030396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,64,balanced,0.3118079900741577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,64,balanced,0.3150506615638733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,64,balanced,0.3222186764081319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,64,balanced,0.32477867603302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,64,balanced,0.33587201436360675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,64,balanced,0.35174401601155597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,64,balanced,0.3628373146057129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,64,balanced,0.39133866628011066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,64,balanced,0.438101331392924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,64,balanced,0.5234346787134806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,64,balanced,0.5906773408253988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,64,balanced,0.6937599976857504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,64,balanced,0.8171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,64,balanced,1.1779413223266602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,64,balanced,1.519445260365804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,2,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,2,power_law_1.2,0.25661439895629884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,2,power_law_1.2,0.36636159420013426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,2,power_law_1.2,0.48660478591918943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,2,power_law_1.2,0.6330368041992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,2,power_law_1.2,1.1165696144104005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,2,power_law_1.2,1.1696127891540526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,2,power_law_1.2,1.2345343589782716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,2,power_law_1.2,1.267916774749756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,2,power_law_1.2,1.3178879737854003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,2,power_law_1.2,1.3129728317260743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,2,power_law_1.2,1.359462356567383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,2,power_law_1.2,1.4106623649597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,2,power_law_1.2,1.4610431671142579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,2,power_law_1.2,1.4866432189941405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,2,power_law_1.2,1.5400959968566894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,2,power_law_1.2,1.576959991455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,2,power_law_1.2,1.722368049621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,2,power_law_1.2,1.7954816818237305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,2,power_law_1.2,2.1188608169555665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,2,power_law_1.2,2.3062463760375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,2,power_law_1.2,2.8796928405761717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,2,power_law_1.2,3.4727935791015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,2,power_law_1.2,4.830412673950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,2,power_law_1.2,5.589401626586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,2,power_law_1.2,8.090419006347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,2,power_law_1.2,0.5988351821899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,2,power_law_1.2,1.0160127639770509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,2,power_law_1.2,1.4501888275146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,2,power_law_1.2,2.4293376922607424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,2,power_law_1.2,3.1324159622192385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,2,power_law_1.2,4.098233413696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,2,power_law_1.2,5.810176086425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,2,power_law_1.2,6.153420639038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,2,power_law_1.2,6.259507369995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,2,power_law_1.2,6.438502502441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,2,power_law_1.2,6.798745727539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,2,power_law_1.2,6.9261314392089846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,2,power_law_1.2,6.9650428771972654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,2,power_law_1.2,7.0991874694824215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,2,power_law_1.2,7.371161651611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,2,power_law_1.2,7.758233642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,2,power_law_1.2,7.85428466796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,2,power_law_1.2,8.047411346435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,2,power_law_1.2,8.361779022216798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,2,power_law_1.2,9.05318374633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,2,power_law_1.2,9.754009246826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,4,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,4,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,4,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,4,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,4,balanced,0.18090667327245077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,4,balanced,0.25975465774536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,4,balanced,0.2609440088272095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,4,balanced,0.26129066944122314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,4,balanced,0.2624853253364563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,4,balanced,0.26333866516749066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,4,balanced,0.26521599292755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,4,balanced,0.2662400007247925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,4,balanced,0.26828799645106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,4,balanced,0.27153066794077557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,4,balanced,0.2773333390553792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,4,balanced,0.28142400582631427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,4,balanced,0.28706133365631104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,4,balanced,0.29661866029103595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,4,balanced,0.3136853377024333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,4,balanced,0.33740798632303876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,4,balanced,0.36522666613260907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,4,balanced,0.41472001870473224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,4,balanced,0.4621653159459432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,2,power_law_1.2,10.743801879882813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,4,balanced,0.5896533330281576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,4,balanced,0.749397357304891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,4,balanced,1.1142826875050862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,4,balanced,1.5232000350952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,2,power_law_1.2,12.404121398925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,2,power_law_1.2,15.44847412109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,2,power_law_1.2,18.29375305175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,2,power_law_1.2,11.200307464599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,2,power_law_1.2,23.396556091308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,2,power_law_1.2,28.520242309570314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,8,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,8,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,8,power_law_1.2,0.04156160056591034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,8,power_law_1.2,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,8,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,8,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,8,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,8,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,8,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,8,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,8,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,8,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,8,power_law_1.2,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,8,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,8,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,8,power_law_1.2,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,8,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,8,power_law_1.2,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,8,power_law_1.2,0.15032320022583007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,8,power_law_1.2,0.22282240390777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,8,power_law_1.2,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,8,power_law_1.2,0.37867519855499265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,8,power_law_1.2,0.5836800098419189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,8,power_law_1.2,0.8427519798278809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,8,power_law_1.2,1.2476415634155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,8,power_law_1.2,1.8405248641967773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,32,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,32,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,32,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,32,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,32,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,32,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,32,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,32,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,32,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,32,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,32,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,32,balanced,0.06348800162474315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,32,balanced,0.06553600231806438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,32,balanced,0.08004266520341237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,32,balanced,0.0766293356815974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,32,balanced,0.11895466844240825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,32,balanced,0.21026132504145303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,32,balanced,0.23125332593917847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,32,balanced,0.27477333943049115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,32,balanced,0.3145386576652527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,32,balanced,0.40004265308380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,32,balanced,0.43775999546051025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,32,balanced,0.5505706469217936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,32,balanced,0.7091200351715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,32,balanced,1.0907306671142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,32,balanced,1.4337706565856934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,2,power_law_1.01,0.4059135913848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,2,power_law_1.01,0.7612287998199463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,2,power_law_1.01,1.0059519767761231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,2,power_law_1.01,1.577779197692871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,2,power_law_1.01,2.063155174255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,2,power_law_1.01,3.23768310546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,2,power_law_1.01,3.227648162841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,2,power_law_1.01,3.493888092041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,2,power_law_1.01,3.68353271484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,2,power_law_1.01,3.7302272796630858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,2,power_law_1.01,3.652608108520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,2,power_law_1.01,3.7988353729248048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,2,power_law_1.01,3.842252731323242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,2,power_law_1.01,4.034150314331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,2,power_law_1.01,4.102348709106446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,2,power_law_1.01,4.157235336303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,2,power_law_1.01,4.316569519042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,2,power_law_1.01,4.481843185424805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,2,power_law_1.01,4.729651260375976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,2,power_law_1.01,5.192895889282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,2,power_law_1.01,5.677875137329101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,2,power_law_1.01,6.985932922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,2,power_law_1.01,7.445708465576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,2,power_law_1.01,9.647103881835937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,2,power_law_1.01,11.375411224365234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,2,power_law_1.01,15.65982666015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,2,power_law_1.01,19.90758361816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,8,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,8,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,8,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,8,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,8,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,8,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,8,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,8,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,8,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,8,power_law_1.2,0.03992320001125336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,8,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,8,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,8,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,8,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,8,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,8,power_law_1.2,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,8,power_law_1.2,0.08663039803504943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,8,power_law_1.2,0.12615679502487182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,8,power_law_1.2,0.19435520172119142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,8,power_law_1.2,0.2381824016571045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,8,power_law_1.2,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,8,power_law_1.2,0.3737600088119507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,8,power_law_1.2,0.5355519771575927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,8,power_law_1.2,0.7024640083312989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,8,power_law_1.2,1.292902374267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,32,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,32,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,32,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,32,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,32,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,32,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,32,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,32,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,32,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,8,power_law_1.2,1.6304128646850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,32,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,32,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,32,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,32,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,32,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,32,power_law_1.01,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,32,power_law_1.01,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,32,power_law_1.01,0.0997376024723053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,32,power_law_1.01,0.1316864013671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,32,power_law_1.01,0.17428480386734008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,32,power_law_1.01,0.2447360038757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,32,power_law_1.01,0.27299840450286866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,32,power_law_1.01,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,32,power_law_1.01,0.5064640045166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,32,power_law_1.01,0.7790592193603516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,32,power_law_1.01,1.1290623664855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,32,power_law_1.01,1.7756160736083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,32,power_law_1.01,2.322431945800781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,4,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,4,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,4,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,4,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,4,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,4,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,4,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,4,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,4,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,4,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,4,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,4,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,4,power_law_1.2,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,4,power_law_1.2,0.09605119824409485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,4,power_law_1.2,0.12819839715957643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,4,power_law_1.2,0.12431360483169555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,4,power_law_1.2,0.15994880199432374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,4,power_law_1.2,0.22814719676971434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,8,power_law_1.2,0.7530496120452881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,8,power_law_1.2,1.0973183631896972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,8,power_law_1.2,1.2281855583190917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,4,power_law_1.2,0.31703040599822996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,8,power_law_1.2,1.619353675842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,8,power_law_1.2,1.760870361328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,8,power_law_1.2,1.825587272644043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,2,power_law_1.01,0.5949440002441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,2,power_law_1.01,1.0442560195922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,8,power_law_1.2,1.9218431472778321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,4,power_law_1.2,0.4567039966583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,8,power_law_1.2,1.8448383331298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,2,power_law_1.01,2.0338687896728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,8,power_law_1.2,1.816985511779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,2,power_law_1.01,2.7617279052734376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,8,power_law_1.2,1.9058687210083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,8,power_law_1.2,1.9372032165527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,2,power_law_1.01,4.536524963378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,4,power_law_1.2,0.5861375808715821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,8,power_law_1.2,2.0074495315551757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,8,power_law_1.2,2.0148223876953124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,2,power_law_1.01,5.152972793579101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,8,power_law_1.2,2.085887908935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,8,power_law_1.2,2.035686492919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,8,power_law_1.2,2.1856256484985352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,2,power_law_1.01,6.867967987060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,8,power_law_1.2,2.1161983489990233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,4,power_law_1.2,0.8278016090393067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,8,power_law_1.2,2.2994943618774415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,2,power_law_1.01,8.707660675048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,8,power_law_1.2,2.412339210510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,8,power_law_1.2,2.6976255416870116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,4,power_law_1.2,1.1304960250854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,2,power_law_1.01,8.917401885986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,8,power_law_1.2,2.9855743408203126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,8,power_law_1.2,3.863961410522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,2,power_law_1.01,9.104793548583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,8,power_law_1.2,4.139622497558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,8,power_law_1.2,4.948172760009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,2,power_law_1.01,9.094963073730469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,8,power_law_1.2,6.731980895996093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,2,power_law_1.01,9.535897827148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,8,power_law_1.2,9.268428802490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,2,power_law_1.01,9.730860900878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,2,power_law_1.01,9.726150512695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,2,power_law_1.01,10.237747192382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,2,power_law_1.01,10.184089660644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,8,power_law_1.2,11.463648223876953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,2,power_law_1.01,10.711039733886718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,2,power_law_1.01,11.830271911621093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,4,power_law_1.2,1.908940887451172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,2,power_law_1.01,11.781734466552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,2,power_law_1.01,12.408013153076173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,2,power_law_1.01,13.208781433105468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,2,power_law_1.01,13.681050109863282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,2,power_law_1.01,15.923782348632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,2,power_law_1.01,18.588223266601563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,4,power_law_1.2,2.6269695281982424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,2,power_law_1.01,21.604966735839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,2,power_law_1.01,28.08647766113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,2,power_law_1.01,28.31523742675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,1,power_law_1.2,1.1143168449401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,1,power_law_1.2,2.0477951049804686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,1,power_law_1.2,4.126515197753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,1,power_law_1.2,7.559782409667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,1,power_law_1.2,10.624614715576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,1,power_law_1.2,14.785722351074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,4,power_law_1.2,3.5360767364501955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,1,power_law_1.2,22.054092407226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,1,power_law_1.2,23.855923461914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,1,balanced,0.3128160039583842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,1,balanced,0.5360639890034994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,1,balanced,1.031167984008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,1,balanced,2.0249600410461426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,1,balanced,4.088831901550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,1,balanced,7.91978645324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,1,power_law_1.2,24.268595886230468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,1,balanced,7.946581522623698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,1,balanced,7.971471786499023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,1,balanced,7.994026819864909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,1,balanced,8.01689592997233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,1,power_law_1.2,24.64849853515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,1,balanced,8.055295944213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,1,balanced,8.099141438802084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,1,balanced,8.132437388102213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,1,balanced,8.200192133585611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,1,power_law_1.2,25.74622802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,1,balanced,8.26589838663737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,1,balanced,8.324437459309896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,1,balanced,8.447317123413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,1,balanced,8.65723737080892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,1,power_law_1.2,27.29697265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,1,balanced,8.876373291015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,1,balanced,9.287850697835287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,1,balanced,10.025290807088217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,1,power_law_1.2,27.49378662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,1,balanced,10.723157246907553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,1,balanced,11.190272013346354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,1,balanced,12.638890584309896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,1,power_law_1.2,28.415179443359374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,1,balanced,14.352383931477865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,4,power_law_1.2,4.758323287963867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,1,balanced,19.361104329427082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,1,power_law_1.2,29.724465942382814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,1,balanced,23.594324747721355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,1,power_law_1.2,30.720819091796876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,1,power_law_1.2,31.92545166015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,1,power_law_1.2,34.077081298828126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,1,power_law_1.2,35.253240966796874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,1,power_law_1.2,37.650637817382815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,1,power_law_1.2,40.148580932617186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,1,power_law_1.2,41.69584655761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,1,power_law_1.2,52.053399658203126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,1,power_law_1.2,65.10427856445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,1,power_law_1.2,72.91514892578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,8,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,8,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,8,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,8,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,8,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,8,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,8,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,8,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,8,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,8,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,8,balanced,0.0730453332265218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,8,balanced,0.07796800136566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,8,balanced,0.11622400085131328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,8,balanced,0.1384106675783793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,8,balanced,0.14506666858990988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,8,balanced,0.19404800732930502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,8,balanced,0.2295466661453247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,8,balanced,0.2638293306032817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,8,balanced,0.31214932600657147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,8,balanced,0.37307735284169513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,8,balanced,0.4768426815668742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,8,balanced,0.6217386722564697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,8,balanced,0.9845759868621826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,8,balanced,1.3830827077229817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,8,balanced,2.121386686960856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,8,balanced,2.8136107126871743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,32,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,32,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,32,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,32,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,32,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,32,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,32,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,32,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,32,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,32,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,32,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,32,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,32,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,32,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,1,power_law_1.2,92.71419067382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,32,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,32,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,32,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,32,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,32,power_law_1.01,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,32,power_law_1.01,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,32,power_law_1.01,0.1347584009170532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,32,power_law_1.01,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,32,power_law_1.01,0.2977792024612427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,32,power_law_1.01,0.4395008087158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,32,power_law_1.01,0.6590464115142822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,1,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,1,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,1,power_law_1.2,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,1,power_law_1.2,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,1,power_law_1.2,0.4241343975067139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,1,power_law_1.2,0.7223296165466309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,1,power_law_1.2,0.7780352115631104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,1,power_law_1.2,0.7979008197784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,1,power_law_1.2,0.8497152328491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,1,power_law_1.2,0.8388607978820801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,1,power_law_1.2,0.8988672256469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,1,power_law_1.2,0.921996784210205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,1,power_law_1.2,0.9224191665649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,1,power_law_1.2,0.9500672340393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,1,power_law_1.2,0.9742336273193359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,1,power_law_1.2,0.9805824279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,1,power_law_1.2,1.0213376045227052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,1,power_law_1.2,1.0676223754882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,1,power_law_1.2,1.1601920127868652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,1,power_law_1.2,1.3000703811645509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,1,power_law_1.2,1.4682111740112305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,1,power_law_1.2,1.7825599670410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,1,power_law_1.2,2.028134346008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,1,power_law_1.2,2.6124288558959963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,1,power_law_1.2,93.31077270507812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,1,power_law_1.2,3.24505615234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,1,power_law_1.2,4.576460647583008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,2,power_law_1.01,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,2,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,2,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,2,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,2,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,2,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,2,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,2,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,2,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,2,power_law_1.01,0.06242560148239136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,2,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,2,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,2,power_law_1.01,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,2,power_law_1.01,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,2,power_law_1.01,0.1060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,2,power_law_1.01,0.10792959928512573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,2,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,2,power_law_1.01,0.20478720664978028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,2,power_law_1.01,0.29552640914916994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,2,power_law_1.01,0.3719167947769165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,2,power_law_1.01,0.37969920635223386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,2,power_law_1.01,0.6260735988616943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,2,power_law_1.01,0.9156607627868653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,1,power_law_1.2,5.724774551391602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,2,power_law_1.01,1.20381441116333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,2,power_law_1.01,1.7280895233154296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,4,power_law_1.2,0.5822463989257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,4,power_law_1.2,1.0119168281555175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,4,power_law_1.2,1.23822078704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,4,power_law_1.2,1.8085887908935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,4,power_law_1.2,1.9597312927246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,4,power_law_1.2,3.213926315307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,4,power_law_1.2,3.7388160705566404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,4,power_law_1.2,3.4754558563232423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,4,power_law_1.2,3.35810546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,4,power_law_1.2,3.236454391479492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,4,power_law_1.2,3.4148353576660155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,4,power_law_1.2,3.5094528198242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,4,power_law_1.2,3.5506175994873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,4,power_law_1.2,3.666944122314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,2,power_law_1.01,2.417868804931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,4,power_law_1.2,3.7201919555664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,4,power_law_1.2,3.783065414428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,4,power_law_1.2,4.028620910644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,4,power_law_1.2,4.219084930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,4,power_law_1.2,4.440268707275391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,4,power_law_1.2,4.515430450439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,4,power_law_1.2,5.061017608642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,4,power_law_1.2,5.325791931152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,4,power_law_1.2,6.311731338500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,4,power_law_1.2,8.718508911132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,4,power_law_1.2,9.874432373046876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,2,power_law_1.01,3.432012939453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,4,power_law_1.2,16.063487243652343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,4,power_law_1.2,17.1831298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.28917760848999025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.5332863807678223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.9332736015319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,1,power_law_1.01,1.3221887588500976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,1,power_law_1.01,1.5634431838989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,1,power_law_1.01,2.031820869445801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,1,power_law_1.01,2.1602304458618162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,1,power_law_1.01,2.1794815063476562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,1,power_law_1.01,2.3597055435180665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,1,power_law_1.01,2.3969791412353514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,1,power_law_1.01,2.5212543487548826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,1,power_law_1.01,2.6001407623291017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,1,power_law_1.01,2.7215871810913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,1,power_law_1.01,2.81845760345459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,1,power_law_1.01,2.9601791381835936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,1,power_law_1.01,3.289702224731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,1,power_law_1.01,3.5106815338134765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,1,power_law_1.01,3.988479995727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,1,power_law_1.01,4.479155349731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,1,power_law_1.01,5.4597633361816404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,1,power_law_1.01,6.343475341796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,2,power_law_1.2,0.597811222076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,2,power_law_1.2,0.8505344390869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,2,power_law_1.2,1.3701120376586915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,1,power_law_1.01,8.281906890869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,2,power_law_1.2,2.0967424392700194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,2,power_law_1.2,2.654617691040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,2,power_law_1.2,4.215193557739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,1,power_law_1.01,10.165452575683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,2,power_law_1.2,4.504576110839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,2,power_law_1.2,4.504371261596679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,2,power_law_1.2,4.848640060424804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,1,power_law_1.01,14.076109313964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,2,power_law_1.2,5.1169281005859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,2,power_law_1.2,5.201919937133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,2,power_law_1.2,5.1324928283691404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,1,power_law_1.01,17.78401336669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,2,power_law_1.2,5.30513916015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,2,power_law_1.2,5.586739349365234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,2,power_law_1.2,5.577318572998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,2,power_law_1.2,5.729280090332031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,2,power_law_1.2,5.895577621459961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,2,power_law_1.2,6.188633728027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,2,power_law_1.2,6.248038482666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,2,power_law_1.2,6.791776275634765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,2,power_law_1.2,7.857561492919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,2,power_law_1.2,9.725132751464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,2,power_law_1.2,10.033152008056641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,2,power_law_1.2,12.455526733398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,8,power_law_1.2,0.3411967992782593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,8,power_law_1.2,0.3727360010147095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,8,power_law_1.2,0.5134335994720459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,8,power_law_1.2,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,8,power_law_1.2,0.6330368041992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,8,power_law_1.2,0.6594560146331787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,8,power_law_1.2,0.6774784088134765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,2,power_law_1.2,15.470790100097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,8,power_law_1.2,0.6789120197296142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,8,power_law_1.2,0.6936575889587402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,8,power_law_1.2,0.6969344139099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,8,power_law_1.2,0.7213056087493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,8,power_law_1.2,0.7260159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,8,power_law_1.2,0.6813695907592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,8,power_law_1.2,0.7288832187652587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,8,power_law_1.2,0.7634943962097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,8,power_law_1.2,0.7929855823516846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,8,power_law_1.2,0.8339455604553223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,8,power_law_1.2,0.8615936279296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,8,power_law_1.2,0.9349120140075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,8,power_law_1.2,1.101414394378662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,8,power_law_1.2,1.3668288230895995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,8,power_law_1.2,1.7049600601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,8,power_law_1.2,2.2931455612182616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,8,power_law_1.2,3.1660032272338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,8,power_law_1.2,3.196518325805664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,2,power_law_1.2,20.554547119140626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,8,power_law_1.2,4.781875228881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,8,power_law_1.2,6.1806591033935545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,2,power_law_1.2,26.456875610351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,64,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,64,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,64,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,64,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,64,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,64,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,64,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,64,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,64,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,64,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,64,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,64,power_law_1.2,0.07003520131111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,64,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,64,power_law_1.2,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,64,power_law_1.2,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,64,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,64,power_law_1.2,0.10464639663696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,64,power_law_1.2,0.15851520299911498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,64,power_law_1.2,0.21626880168914794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,64,power_law_1.2,0.2777087926864624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,64,power_law_1.2,0.34713599681854246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,64,power_law_1.2,0.5119999885559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,64,power_law_1.2,0.8380415916442872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,64,power_law_1.2,1.3209600448608398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,64,power_law_1.2,1.531494426727295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,64,power_law_1.2,2.532966423034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,64,power_law_1.2,4.02350082397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,8,balanced,0.27409066756566364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,8,balanced,0.24422399202982584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,8,balanced,0.24473599592844644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,8,balanced,0.24490666389465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,8,balanced,0.24744532505671182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,8,balanced,0.2491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,8,balanced,0.250709335009257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,8,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,8,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,8,balanced,0.25497599442799884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,8,balanced,0.2529279987017314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,8,balanced,0.25547200441360474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,8,balanced,0.2582079966862996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,8,balanced,0.26897066831588745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,8,balanced,0.2783573269844055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,8,balanced,0.28296534220377606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,8,balanced,0.2986666758855184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,8,balanced,0.3577173153559367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,8,balanced,0.4135040044784546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,8,balanced,0.582314650217692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,8,balanced,0.7176533540089926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,16,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,16,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,8,balanced,0.9970293045043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,16,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,16,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,16,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,16,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,16,balanced,0.0283146674434344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,16,balanced,0.02847466617822647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,8,balanced,1.260543982187907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,16,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,16,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,16,balanced,0.030026666820049286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,16,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,16,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,8,balanced,1.7757867177327473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,16,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,16,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,16,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,16,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,8,balanced,2.2817866007486978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,16,balanced,0.09915733337402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,16,balanced,0.21009065707524618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,16,balanced,0.3199999928474426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,16,balanced,0.4509013493855794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,8,balanced,3.3779945373535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,16,balanced,0.702122688293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,16,balanced,0.9528319835662842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,8,balanced,4.488874753316243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,16,power_law_1.2,0.471449613571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,16,power_law_1.2,0.42803201675415037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,16,power_law_1.2,0.40385918617248534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,16,power_law_1.2,0.45711359977722166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,16,power_law_1.2,0.33566720485687257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,16,power_law_1.2,0.4093952178955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,16,power_law_1.2,0.46100478172302245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,16,power_law_1.2,0.4423679828643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,16,power_law_1.2,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,16,power_law_1.2,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,16,power_law_1.2,0.47575039863586427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,16,power_law_1.2,0.4773888111114502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,16,power_law_1.2,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,16,power_law_1.2,0.4739071846008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,16,power_law_1.2,0.5029888153076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,16,power_law_1.2,0.505024003982544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,16,power_law_1.2,0.5271552085876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,16,power_law_1.2,0.6199295997619629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,16,power_law_1.2,0.7278592109680175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,16,power_law_1.2,0.8232959747314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,16,power_law_1.2,1.0463232040405273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,16,power_law_1.2,1.4245887756347657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,4,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,16,power_law_1.2,1.7485824584960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,4,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,4,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,4,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,4,balanced,0.2846720019976298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,4,balanced,0.5398186842600504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,4,balanced,0.7927467028299967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,4,balanced,0.7869439919789633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,4,balanced,0.788821299870809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,4,balanced,0.7910400231679281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,4,balanced,0.7976799805959066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,4,balanced,0.8070826530456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,4,balanced,0.8135680357615153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,4,balanced,0.8280746936798096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,4,balanced,0.841386636098226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,4,balanced,0.8550399939219157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,4,balanced,0.884394645690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,4,balanced,0.959658702214559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,4,balanced,0.9861120382944742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,4,balanced,1.0862932999928792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,4,balanced,1.1847679615020752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,4,balanced,1.41704527537028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,4,balanced,1.6529067357381184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,16,power_law_1.2,2.5530368804931642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,4,balanced,2.1736106872558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,4,balanced,2.7265707651774087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,4,balanced,3.8463147481282554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,4,balanced,4.928000132242839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,16,power_law_1.2,3.2266239166259765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,16,power_law_1.2,4.257382583618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,16,power_law_1.2,6.343059158325195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,32,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,32,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,32,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,32,power_law_1.01,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,32,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,32,power_law_1.01,0.037062400579452516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,32,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,32,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,32,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,32,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,32,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,32,power_law_1.01,0.04524799883365631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,32,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,32,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,32,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,32,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,32,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,32,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,32,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,32,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,32,power_law_1.01,0.10895359516143799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,32,power_law_1.01,0.13352960348129272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,32,power_law_1.01,0.1802240014076233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,32,power_law_1.01,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,32,power_law_1.01,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,32,power_law_1.01,0.643071985244751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,32,power_law_1.01,0.9316351890563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,4,power_law_1.01,0.47226881980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,4,power_law_1.01,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,4,power_law_1.01,0.8204287528991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,4,power_law_1.01,0.9127936363220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,4,power_law_1.01,0.9125887870788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,4,power_law_1.01,0.9297663688659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,4,power_law_1.01,0.9474047660827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,4,power_law_1.01,1.1822976112365722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,4,power_law_1.01,1.4264320373535155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,4,power_law_1.01,1.4049280166625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,4,power_law_1.01,1.2699647903442384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,4,power_law_1.01,1.368678379058838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,4,power_law_1.01,1.5894528388977052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,4,power_law_1.01,1.8917247772216796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,4,power_law_1.01,2.1452800750732424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,2,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,2,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,4,power_law_1.01,2.372403144836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,2,power_law_1.2,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,2,power_law_1.2,0.156876802444458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,2,power_law_1.2,0.21810560226440429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,2,power_law_1.2,0.40366082191467284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,2,power_law_1.2,0.4034560203552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,4,power_law_1.01,3.2308990478515627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,2,power_law_1.2,0.42598400115966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,2,power_law_1.2,0.43438081741333007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,2,power_law_1.2,0.42229762077331545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,2,power_law_1.2,0.4661248207092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,2,power_law_1.2,0.45998082160949705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,4,power_law_1.01,4.103782272338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,2,power_law_1.2,0.46776318550109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,2,power_law_1.2,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,2,power_law_1.2,0.4851712226867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,2,power_law_1.2,0.48148479461669924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,2,power_law_1.2,0.4986879825592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,2,power_law_1.2,0.5167103767395019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,2,power_law_1.2,0.5652480125427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,2,power_law_1.2,0.6352896213531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,2,power_law_1.2,0.7256063938140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,2,power_law_1.2,0.8945664405822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,2,power_law_1.2,1.112268829345703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,4,power_law_1.01,5.156659317016602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,2,power_law_1.2,1.5163392066955566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,4,power_law_1.01,6.0293121337890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,4,power_law_1.01,7.320575714111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,2,power_law_1.2,2.0357120513916014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,4,power_law_1.01,8.315084838867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,4,power_law_1.01,10.906009674072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,16,power_law_1.01,1.0766207695007324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,16,power_law_1.01,2.066431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,16,power_law_1.01,3.0724096298217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,16,power_law_1.01,2.949939155578613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,16,power_law_1.01,3.076915168762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,16,power_law_1.01,3.0539775848388673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,16,power_law_1.01,2.4557567596435548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,16,power_law_1.01,2.462105560302734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,16,power_law_1.01,2.4168447494506835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,16,power_law_1.01,2.267955207824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,16,power_law_1.01,2.5644927978515626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,16,power_law_1.01,2.4614912033081056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,16,power_law_1.01,2.8006399154663084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,16,power_law_1.01,2.4340415954589845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,16,power_law_1.01,2.814156723022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,16,power_law_1.01,2.9087743759155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,16,power_law_1.01,2.772172737121582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,2,power_law_1.2,2.639257621765137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,16,power_law_1.01,2.935603141784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,16,power_law_1.01,3.2071678161621096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,16,power_law_1.01,3.3851390838623048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,16,power_law_1.01,3.596083068847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,16,power_law_1.01,4.077561569213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,4,power_law_1.01,15.059552001953126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,16,power_law_1.01,4.285235214233398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,16,power_law_1.01,5.571174240112304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,16,power_law_1.01,6.951116943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,16,power_law_1.01,10.313932800292969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,16,power_law_1.01,9.923379516601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,2,power_law_1.2,3.9315326690673826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,4,power_law_1.01,18.09899444580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,2,power_law_1.01,0.34652159214019773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,2,power_law_1.01,0.5584896087646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,2,power_law_1.01,0.7370751857757568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,2,power_law_1.01,1.1560959815979004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,4,power_law_1.01,23.013343811035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,2,power_law_1.01,1.4602239608764649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,2,power_law_1.01,2.2513664245605467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,2,power_law_1.01,2.2405120849609377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,2,power_law_1.01,2.381823921203613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,2,power_law_1.01,2.383027267456055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,2,power_law_1.01,2.478079986572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,2,power_law_1.01,2.5473024368286135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,2,power_law_1.01,2.5432064056396486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,2,power_law_1.01,2.6028032302856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,2,power_law_1.01,2.7097087860107423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,2,power_law_1.01,2.712166404724121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,2,power_law_1.01,2.7009023666381835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,2,power_law_1.01,2.791833686828613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,2,power_law_1.01,2.979430389404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,2,power_law_1.01,3.113983917236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,2,power_law_1.01,3.303424072265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,2,power_law_1.01,3.5749889373779298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,2,power_law_1.01,4.457267379760742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,2,power_law_1.01,5.0597888946533205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,2,power_law_1.01,6.48437728881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,2,power_law_1.01,7.515135955810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,2,power_law_1.01,10.978508758544923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,2,power_law_1.01,14.06341094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,4,power_law_1.01,27.46900329589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,8,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,8,balanced,0.306005338827769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,8,balanced,0.5911893447240194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,8,balanced,1.118890682856242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,8,balanced,1.4062933921813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,8,balanced,1.4102187156677246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,8,balanced,1.3887146313985188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,8,balanced,1.3934933344523113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,8,balanced,1.3960533142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,8,balanced,1.4039039611816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,8,balanced,1.4105440775553386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,8,balanced,1.4161920547485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,8,balanced,1.4291626612345378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,8,balanced,1.439893404642741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,8,balanced,1.4849707285563152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,8,balanced,1.510229269663493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,8,balanced,1.545728047688802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,8,balanced,1.5737172762552898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,8,balanced,1.71997865041097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,8,balanced,1.661952018737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,8,balanced,1.8334719340006511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,8,balanced,2.0019200642903647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,8,balanced,2.406229337056478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,8,balanced,3.0446933110555015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,8,balanced,4.222805341084798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,8,balanced,5.529578526814778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,32,power_law_1.2,0.5980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,32,power_law_1.2,0.5470208168029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,32,power_law_1.2,0.5492735862731933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,32,power_law_1.2,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,32,power_law_1.2,0.49213438034057616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,32,power_law_1.2,0.4220928192138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,32,power_law_1.2,0.5132287979125977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,32,power_law_1.2,0.4734975814819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,32,power_law_1.2,0.5013504028320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,32,power_law_1.2,0.4775807857513428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,32,power_law_1.2,0.5087232112884521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,32,power_law_1.2,0.5122047901153565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,32,power_law_1.2,0.550707197189331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,32,power_law_1.2,0.5033984184265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,32,power_law_1.2,0.5517312049865722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,32,power_law_1.2,0.5353472232818604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,32,power_law_1.2,0.5955584049224854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,32,power_law_1.2,0.6135615825653076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,32,power_law_1.2,0.6928383827209472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,32,power_law_1.2,0.7915520191192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,32,power_law_1.2,0.9021439552307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,32,power_law_1.2,1.2908543586730956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,32,power_law_1.2,1.693894386291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,32,power_law_1.2,2.24768009185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,32,power_law_1.2,2.8833791732788088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,32,power_law_1.2,4.298137664794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,32,power_law_1.2,5.610086441040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,2,power_law_1.01,0.1931264042854309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,2,power_law_1.01,0.32522239685058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,2,power_law_1.01,0.4272128105163574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,2,power_law_1.01,0.8146944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,2,power_law_1.01,0.881049633026123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,2,power_law_1.01,1.457356834411621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,2,power_law_1.01,1.5202303886413575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,2,power_law_1.01,1.5994879722595214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,2,power_law_1.01,1.6902143478393554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,2,power_law_1.01,1.5550463676452637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,2,power_law_1.01,1.6840511322021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,2,power_law_1.01,1.7537023544311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,2,power_law_1.01,1.7719295501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,2,power_law_1.01,1.7872896194458008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,2,power_law_1.01,1.8077695846557618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,2,power_law_1.01,1.8249727249145509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,2,power_law_1.01,1.8886655807495116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,2,power_law_1.01,1.9711999893188477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,2,power_law_1.01,1.9904512405395507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,2,power_law_1.01,2.0764671325683595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,2,power_law_1.01,2.342502403259277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,2,power_law_1.01,2.8651519775390626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,2,power_law_1.01,2.91778564453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,2,power_law_1.01,3.8035457611083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,2,power_law_1.01,4.294041442871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,2,power_law_1.01,5.686681747436523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,2,power_law_1.01,7.2087554931640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,4,power_law_1.01,0.324403190612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,4,power_law_1.01,0.5455872058868408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,4,power_law_1.01,1.04017915725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,4,power_law_1.01,1.0289152145385743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,4,power_law_1.01,1.5765503883361816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,4,power_law_1.01,1.8110464096069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,4,power_law_1.01,1.6541696548461915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,4,power_law_1.01,2.4596479415893553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,4,power_law_1.01,2.5692159652709963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,4,power_law_1.01,2.5649152755737306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,4,power_law_1.01,2.205286407470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,4,power_law_1.01,2.5274368286132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,4,power_law_1.01,2.6030080795288084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,4,power_law_1.01,2.713190460205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,4,power_law_1.01,2.660147285461426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,4,power_law_1.01,2.675904083251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,4,power_law_1.01,2.705407905578613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,4,power_law_1.01,2.867404747009277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,4,power_law_1.01,2.976563262939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,4,power_law_1.01,3.1627199172973635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,4,power_law_1.01,3.298099136352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,4,power_law_1.01,3.6519935607910154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,4,power_law_1.01,4.201267242431641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,4,power_law_1.01,5.055487823486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,4,power_law_1.01,5.852979278564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,4,power_law_1.01,7.753932952880859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,4,power_law_1.01,9.426739501953126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,64,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,64,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,64,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,64,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,64,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,64,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,64,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,64,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,64,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,64,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,64,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,64,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,64,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,64,balanced,0.04436799883842468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,64,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,64,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,64,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,64,balanced,0.07116266588370006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,64,balanced,0.1397760013739268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,64,balanced,0.20036266247431436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,64,balanced,0.343722661336263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,64,balanced,0.4275199969609578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,128,power_law_1.01,0.05303679704666138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,128,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,128,power_law_1.01,0.05260800123214722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,128,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,128,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,128,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,128,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,128,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,128,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,128,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,128,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,128,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,128,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,128,power_law_1.01,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,128,power_law_1.01,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,128,power_law_1.01,0.11919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,128,power_law_1.01,0.18288639783859253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,128,power_law_1.01,0.2207360029220581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,128,power_law_1.01,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,128,power_law_1.01,0.33749120235443114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,128,power_law_1.01,0.36761600971221925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,128,power_law_1.01,0.496230411529541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,128,power_law_1.01,0.6359039783477783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,128,power_law_1.01,0.953548812866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,128,power_law_1.01,1.3961215972900392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,128,power_law_1.01,2.1766143798828126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,128,power_law_1.01,3.001958465576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,16,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,16,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,16,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,16,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,16,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,16,balanced,0.0496373325586319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,16,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,16,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,16,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,16,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,16,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,16,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,16,balanced,0.057333335280418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,16,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,16,balanced,0.06348800162474315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,16,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,16,balanced,0.07423999905586243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,16,balanced,0.11876799662907918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,16,balanced,0.19949867328008017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,16,balanced,0.2510293324788411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,16,balanced,0.30054400364557904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,16,balanced,0.3949226538340251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,16,balanced,0.49749334653218585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,16,balanced,0.7447893619537354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,16,balanced,0.9954986572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,16,balanced,1.508010705312093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,16,balanced,2.054314613342285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,2,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,2,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,2,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,2,power_law_1.01,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,2,power_law_1.01,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,2,power_law_1.01,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,2,power_law_1.01,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,2,power_law_1.01,0.32071681022644044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,2,power_law_1.01,0.3469311952590942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,2,power_law_1.01,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,2,power_law_1.01,0.35983359813690186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,2,power_law_1.01,0.3780607938766479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,2,power_law_1.01,0.38092799186706544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,2,power_law_1.01,0.3985408067703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,2,power_law_1.01,0.4315135955810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,2,power_law_1.01,0.44748802185058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,2,power_law_1.01,0.48865280151367185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,2,power_law_1.01,0.5687295913696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,2,power_law_1.01,0.643071985244751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,2,power_law_1.01,0.8427519798278809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,2,power_law_1.01,1.0668031692504882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,2,power_law_1.01,1.477836799621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,2,power_law_1.01,1.906483268737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,2,power_law_1.01,2.741043281555176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,2,power_law_1.01,3.554099273681641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,2,power_law_1.01,5.18922233581543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,2,power_law_1.01,7.499980926513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,4,balanced,0.027466667195161183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,4,balanced,0.02831999957561493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,4,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,4,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,4,balanced,0.24574400981267294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,4,balanced,0.2481493353843689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,4,balanced,0.2500266631444295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,4,balanced,0.25173334280649823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,4,balanced,0.2529279987017314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,4,balanced,0.25446399052937824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,4,balanced,0.25702399015426636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,4,balanced,0.2629973292350769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,4,balanced,0.26470400889714557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,4,balanced,0.27084799607594806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,4,balanced,0.27801599105199176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,4,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,4,balanced,0.2974613308906555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,4,balanced,0.3232426643371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,4,balanced,0.3326293428738912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,4,balanced,0.373418649037679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,4,balanced,0.411135991414388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,4,balanced,0.5085866848627726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,4,balanced,0.6258346637090048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,4,balanced,0.9275733629862467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,4,balanced,1.2479146321614583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,4,balanced,1.9177759488423665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,4,balanced,2.5975467363993325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,64,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,64,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,64,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,64,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,64,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,64,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,64,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,64,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,64,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,64,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,64,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,64,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,64,power_law_1.01,0.060819202661514284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,64,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,64,power_law_1.01,0.09728000164031983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,64,power_law_1.01,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,64,power_law_1.01,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,64,power_law_1.01,0.37601280212402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,64,power_law_1.01,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,64,power_law_1.01,0.6565887928009033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,64,power_law_1.01,0.993280029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,64,power_law_1.01,1.529651165008545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,4,power_law_1.2,0.5265408039093018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,4,power_law_1.2,0.7387135982513428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,4,power_law_1.2,0.818995189666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,4,power_law_1.2,0.9121791839599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,4,power_law_1.2,0.9117695808410644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,4,power_law_1.2,0.9234432220458985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,4,power_law_1.2,0.9365311622619629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,4,power_law_1.2,1.2253055572509766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,4,power_law_1.2,1.3766592025756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,4,power_law_1.2,1.284505558013916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,4,power_law_1.2,1.2822527885437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,4,power_law_1.2,1.5429632186889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,4,power_law_1.2,1.5790016174316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,4,power_law_1.2,1.8835456848144532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,4,power_law_1.2,2.1401599884033202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,4,power_law_1.2,2.6251264572143556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,4,power_law_1.2,3.315097427368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,4,power_law_1.2,4.094566345214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,4,power_law_1.2,4.745420837402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,4,power_law_1.2,6.324428939819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,4,power_law_1.2,7.005382537841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,4,power_law_1.2,9.189990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,16,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,16,power_law_1.2,0.0636672019958496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,16,power_law_1.2,0.053439998626708986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,16,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,4,power_law_1.2,10.902528381347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,16,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,16,power_law_1.2,0.0554751992225647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,16,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,16,power_law_1.2,0.05812479853630066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,16,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,16,power_law_1.2,0.057740801572799684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,16,power_law_1.2,0.05936639904975891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,16,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,16,power_law_1.2,0.08536959886550903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,16,power_law_1.2,0.08704000115394592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,16,power_law_1.2,0.12840960025787354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,16,power_law_1.2,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,16,power_law_1.2,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,16,power_law_1.2,0.260915207862854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,16,power_law_1.2,0.3147775888442993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,16,power_law_1.2,0.3669823884963989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,16,power_law_1.2,0.49397759437561034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,16,power_law_1.2,0.693452787399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,16,power_law_1.2,1.043660831451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,16,power_law_1.2,1.5204352378845214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,16,power_law_1.2,2.3267328262329103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,16,power_law_1.2,3.351116943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,4,power_law_1.2,14.268826293945313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,4,power_law_1.2,18.087309265136717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,4,power_law_1.2,22.39569854736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,4,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,4,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,4,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,4,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,4,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,4,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,2,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,4,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,2,power_law_1.01,0.344268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,4,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,2,power_law_1.01,0.5586688041687011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,4,power_law_1.01,0.05300480127334595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,4,power_law_1.01,0.053414398431777955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,2,power_law_1.01,0.7352320194244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,4,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,2,power_law_1.01,0.9848832130432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,4,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,2,power_law_1.01,1.5509504318237304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,4,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,4,power_law_1.01,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,2,power_law_1.01,1.567743968963623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,4,power_law_1.01,0.06611199975013733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,2,power_law_1.01,1.4979071617126465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,4,power_law_1.01,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,4,power_law_1.01,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,2,power_law_1.01,1.6320512771606446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,4,power_law_1.01,0.10219520330429077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,4,power_law_1.01,0.1879680037498474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,2,power_law_1.01,1.6813888549804688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,4,power_law_1.01,0.23610880374908447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,4,power_law_1.01,0.3530751943588257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,2,power_law_1.01,1.6979711532592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,4,power_law_1.01,0.4640768051147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,2,power_law_1.01,1.735251235961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,4,power_law_1.01,0.764518404006958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,2,power_law_1.01,1.7383424758911132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,4,power_law_1.01,1.0975232124328613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,2,power_law_1.01,1.761894416809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,2,power_law_1.01,1.7958911895751952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,4,power_law_1.2,29.575167846679687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,4,power_law_1.01,1.7862655639648437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,2,power_law_1.01,1.8702335357666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,2,power_law_1.01,1.8771968841552735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,4,power_law_1.01,2.3949312210083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,2,power_law_1.01,1.9519168853759765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,2,power_law_1.01,2.1108736038208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,2,power_law_1.01,2.4012544631958006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,2,power_law_1.01,2.5604095458984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,2,power_law_1.01,3.2088062286376955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,2,power_law_1.01,3.3572864532470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,2,power_law_1.01,4.6104576110839846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,2,power_law_1.01,5.88328971862793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,2,power_law_1.01,8.080793762207032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,2,power_law_1.01,10.67356185913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,2,power_law_1.2,0.21831679344177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,2,power_law_1.2,0.33013761043548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,2,power_law_1.2,0.5058559894561767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,2,power_law_1.2,0.7646848201751709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,2,power_law_1.2,0.9771007537841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,2,power_law_1.2,1.6117759704589845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,2,power_law_1.2,1.7119232177734376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,2,power_law_1.2,1.7655807495117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,2,power_law_1.2,1.823334312438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,2,power_law_1.2,1.8536447525024413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,2,power_law_1.2,1.944371223449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,2,power_law_1.2,1.9542015075683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,2,power_law_1.2,2.0572160720825194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,2,power_law_1.2,2.133600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,2,power_law_1.2,2.226790428161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,2,power_law_1.2,2.2859775543212892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,2,power_law_1.2,2.305843162536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,2,power_law_1.2,2.450841522216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,2,power_law_1.2,2.7147903442382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,2,power_law_1.2,3.139993667602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,2,power_law_1.2,3.6317184448242186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,64,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,64,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,64,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,2,power_law_1.2,4.615987014770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,64,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,64,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,64,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,64,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,2,power_law_1.2,5.178777694702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,64,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,64,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,64,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,64,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,64,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,64,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,64,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,64,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,2,power_law_1.2,7.037535858154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,64,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,64,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,64,power_law_1.2,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,64,power_law_1.2,0.10751359462738037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,64,power_law_1.2,0.14807039499282837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,64,power_law_1.2,0.21770238876342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,64,power_law_1.2,0.3741631984710693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,2,power_law_1.2,8.8342529296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,64,power_law_1.2,0.49295358657836913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,64,power_law_1.2,0.7383039951324463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,4,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,4,balanced,0.23825067281723022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,4,balanced,0.45687464872996014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,64,power_law_1.2,0.992255973815918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,4,balanced,0.8751786549886068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,4,balanced,1.715712070465088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,4,balanced,1.772714614868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,4,balanced,1.7797120412190754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,4,balanced,1.7269760767618816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,4,balanced,1.733290672302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,2,power_law_1.2,12.478873443603515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,4,balanced,1.734997272491455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,4,balanced,1.7442132631937664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,4,balanced,1.7585493723551433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,4,balanced,1.7812479337056477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,4,balanced,1.7986559867858887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,4,balanced,1.8416639963785808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,4,balanced,1.85480531056722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,4,balanced,1.8783574104309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,4,balanced,1.9200000762939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,4,balanced,1.9447414080301921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,4,balanced,2.038442611694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,4,balanced,2.0896426836649575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,2,power_law_1.2,15.767141723632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,4,balanced,2.329429308573405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,4,balanced,2.513578732808431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,4,balanced,3.1740585962931314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,4,balanced,3.9098027547200522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,4,balanced,5.722282409667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,4,balanced,7.49124272664388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,8,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,8,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,8,power_law_1.01,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,8,power_law_1.01,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,8,power_law_1.01,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,8,power_law_1.01,0.24944639205932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,8,power_law_1.01,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,8,power_law_1.01,0.27402238845825194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,8,power_law_1.01,0.2617343902587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,8,power_law_1.01,0.2746239900588989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,8,power_law_1.01,0.28631041049957273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,8,power_law_1.01,0.265830397605896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,8,power_law_1.01,0.26398720741271975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,8,power_law_1.01,0.29265921115875243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,8,power_law_1.01,0.31436800956726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,8,power_law_1.01,0.30945279598236086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,8,power_law_1.01,0.33075199127197263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,8,power_law_1.01,0.3762176036834717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,8,power_law_1.01,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,8,power_law_1.01,0.4675583839416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,8,power_law_1.01,0.5326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,8,power_law_1.01,0.6782976150512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,8,power_law_1.01,0.9217920303344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,8,power_law_1.01,1.3803520202636719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,8,power_law_1.01,1.8358272552490233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,8,power_law_1.01,2.7297792434692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,8,power_law_1.01,3.7402622222900392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,1,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,1,power_law_1.2,0.08680959939956664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,8,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,8,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,1,power_law_1.2,0.20971519947052003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,8,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,1,power_law_1.2,0.3221503973007202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,8,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,8,power_law_1.01,0.0403328001499176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,1,power_law_1.2,0.43192319869995116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,8,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,1,power_law_1.2,0.7364607810974121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,8,power_law_1.01,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,1,power_law_1.2,0.7745535850524903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,8,power_law_1.01,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,8,power_law_1.01,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,1,power_law_1.2,0.8169471740722656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,8,power_law_1.01,0.09195520281791687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,1,power_law_1.2,0.8326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,1,power_law_1.2,0.8376319885253907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,8,power_law_1.01,0.12247040271759033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,8,power_law_1.01,0.1275904059410095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,1,power_law_1.2,0.8787839889526368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,1,power_law_1.2,0.9021439552307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,1,power_law_1.2,0.9027584075927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,1,power_law_1.2,0.9201343536376954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,8,power_law_1.01,0.20008959770202636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,1,power_law_1.2,0.9324543952941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,8,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,1,power_law_1.2,0.9654272079467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,1,power_law_1.2,0.9918080329895019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,8,power_law_1.01,0.3637248039245605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,1,power_law_1.2,1.0571776390075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,1,power_law_1.2,1.1161343574523925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,1,power_law_1.2,1.2740608215332032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,1,power_law_1.2,1.4395392417907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,1,power_law_1.2,1.7590272903442383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,8,power_law_1.01,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,8,power_law_1.01,0.7383039951324463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,1,power_law_1.2,2.164512062072754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,8,power_law_1.01,1.0016768455505372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,1,power_law_1.2,2.8892927169799805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,1,power_law_1.2,3.3851390838623048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,8,power_law_1.01,1.6476032257080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,8,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,8,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,8,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,8,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,8,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,8,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,8,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,8,balanced,0.026602665583292644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,8,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,8,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,8,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,8,balanced,0.027642667293548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,8,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,8,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,8,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,8,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,8,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,8,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,8,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,8,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,8,balanced,0.08396800359090169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,8,balanced,0.1367039978504181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,8,balanced,0.2836479942003886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,8,balanced,0.3768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,8,balanced,0.5848480065663656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,8,balanced,0.7946240107218424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,8,power_law_1.01,2.3801855087280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,1,power_law_1.2,4.699750518798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,4,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,4,power_law_1.2,0.03787519931793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,4,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,4,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,4,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,4,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,4,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,4,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,4,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,4,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,4,power_law_1.2,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,4,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,4,power_law_1.2,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,4,power_law_1.2,0.08108800053596496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,4,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,4,power_law_1.2,0.12840319871902467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,4,power_law_1.2,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,8,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,8,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,4,power_law_1.2,0.23244800567626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,8,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,8,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,8,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,8,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,8,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,8,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,4,power_law_1.2,0.2920448064804077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,8,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,8,balanced,0.025413334369659424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,4,power_law_1.2,0.14704639911651612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,8,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,8,balanced,0.02626666675011317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,8,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,8,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,8,balanced,0.03054400036732356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,8,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,4,power_law_1.2,0.15892479419708253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,8,balanced,0.036176001032193504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,8,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,8,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,8,balanced,0.05649066468079885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,8,balanced,0.08072533210118611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,4,power_law_1.2,0.16834559440612792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,8,balanced,0.10785599549611409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,8,balanced,0.22732800245285034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,8,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,4,power_law_1.2,0.35570559501647947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,8,balanced,0.4642133315404256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,4,power_law_1.2,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,8,balanced,0.6324906746546427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,4,power_law_1.2,0.4616191864013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,4,power_law_1.2,0.4462592124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,4,power_law_1.2,0.21831679344177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,4,power_law_1.2,0.4773888111114502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,4,power_law_1.2,0.4438015937805176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,4,power_law_1.2,0.4824831962585449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,4,power_law_1.2,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,4,power_law_1.2,0.5122047901153565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,4,power_law_1.2,0.5560319900512696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,4,power_law_1.2,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,4,power_law_1.2,0.5935103893280029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,4,power_law_1.2,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,4,power_law_1.2,0.745472002029419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,4,power_law_1.2,0.9388031959533691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,4,power_law_1.2,0.319488000869751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,4,power_law_1.2,1.0536959648132325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,4,power_law_1.2,1.4841856002807616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,4,power_law_1.2,1.841561508178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,4,power_law_1.2,2.4559616088867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,4,power_law_1.2,3.3511425018310548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,4,power_law_1.2,0.4083712100982666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,4,power_law_1.2,5.1230720520019535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,4,power_law_1.2,6.28100471496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,4,power_law_1.2,0.5533696174621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,8,power_law_1.01,3.607494354248047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,4,power_law_1.2,0.847871971130371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,4,power_law_1.2,1.0989567756652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,1,power_law_1.2,5.985894393920899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,8,power_law_1.01,4.515635299682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,4,power_law_1.2,1.8984960556030273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,2,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,2,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,64,power_law_1.2,0.321126389503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,2,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,64,power_law_1.2,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,2,power_law_1.01,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,64,power_law_1.2,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,2,power_law_1.01,0.3184639930725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,2,power_law_1.01,0.41244797706604003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,64,power_law_1.2,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,2,power_law_1.01,0.44892158508300783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,64,power_law_1.2,0.22302720546722413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,64,power_law_1.2,0.26910719871520994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,64,power_law_1.2,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,64,power_law_1.2,0.28446719646453855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,64,power_law_1.2,0.2789376020431519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,64,power_law_1.2,0.29982719421386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,2,power_law_1.01,0.6152192115783691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,64,power_law_1.2,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,2,power_law_1.01,0.6223872184753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,2,power_law_1.01,0.6358719825744629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,2,power_law_1.01,0.6080512046813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,64,power_law_1.2,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,2,power_law_1.01,0.6440959930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,64,power_law_1.2,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,2,power_law_1.01,0.6967103958129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,64,power_law_1.2,0.316211199760437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,2,power_law_1.01,0.7073791980743408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,64,power_law_1.2,0.3311615943908691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,2,power_law_1.01,0.7555071830749511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,64,power_law_1.2,0.318668794631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,2,power_law_1.01,0.7927807807922364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,64,power_law_1.2,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,2,power_law_1.01,0.8069120407104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,64,power_law_1.2,0.36433920860290525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,2,power_law_1.01,0.9201663970947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,64,power_law_1.2,0.4122623920440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,2,power_law_1.01,0.993280029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,64,power_law_1.2,0.5244927883148194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,2,power_law_1.01,1.2189696311950684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,64,power_law_1.2,0.558899211883545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,64,power_law_1.2,0.8212479591369629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,2,power_law_1.01,1.4845952033996581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,64,power_law_1.2,0.9402303695678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,2,power_law_1.01,1.8800640106201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,64,power_law_1.2,1.389356803894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,2,power_law_1.01,2.2417407989501954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,4,power_law_1.2,2.101043128967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,2,power_law_1.01,3.0889984130859376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,64,power_law_1.2,2.271027183532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,2,power_law_1.01,3.846758270263672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,64,power_law_1.2,2.936627197265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,2,power_law_1.01,5.441740798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,2,power_law_1.01,7.3787391662597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,64,power_law_1.2,4.375347137451172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,4,power_law_1.2,3.3593345642089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,32,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,32,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,32,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,32,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,32,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,32,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,32,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,32,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,32,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,32,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,32,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,32,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,32,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,32,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,32,power_law_1.2,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,32,power_law_1.2,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,32,power_law_1.2,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,32,power_law_1.2,0.13434879779815673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,32,power_law_1.2,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,32,power_law_1.2,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,32,power_law_1.2,0.4034560203552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,32,power_law_1.2,0.5113855838775635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,32,power_law_1.2,0.6270976066589355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,32,power_law_1.2,1.0782719612121583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,4,power_law_1.2,5.820006561279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,32,power_law_1.2,1.3041600227355956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,32,power_law_1.2,2.3453695297241213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,32,power_law_1.2,0.3215359926223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,32,power_law_1.2,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,32,power_law_1.2,0.2908031940460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,32,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,32,power_law_1.2,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,32,power_law_1.2,0.27832319736480715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,32,power_law_1.2,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,32,power_law_1.2,0.2836479902267456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,32,power_law_1.2,0.265011191368103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,32,power_law_1.2,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,32,power_law_1.2,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,32,power_law_1.2,0.27156479358673097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,32,power_law_1.2,0.2770944118499756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,32,power_law_1.2,0.2830336093902588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,32,power_law_1.2,0.319488000869751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,32,power_law_1.2,0.3131392002105713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,32,power_law_1.2,0.3379199981689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,32,power_law_1.2,0.372326397895813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,32,power_law_1.2,0.40325121879577636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,32,power_law_1.2,0.48721919059753416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,32,power_law_1.2,0.5242879867553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,32,power_law_1.2,0.7180287837982178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,32,power_law_1.2,0.9369600296020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,32,power_law_1.2,1.6736255645751954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,32,power_law_1.2,1.8671615600585938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,32,power_law_1.2,3.4127872467041014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,32,power_law_1.2,4.391731262207031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,16,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,16,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,16,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,16,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,16,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,16,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,16,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,16,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,16,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,16,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,16,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,16,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,16,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,16,power_law_1.01,0.06592640280723572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,16,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,16,power_law_1.01,0.05240960121154785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,16,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,16,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,16,power_law_1.01,0.10792319774627686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,16,power_law_1.01,0.14725120067596437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,16,power_law_1.01,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,16,power_law_1.01,0.2748415946960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,16,power_law_1.01,0.5449728012084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,16,power_law_1.01,0.6739903926849365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,16,power_law_1.01,1.1796480178833009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,16,power_law_1.01,1.7237823486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.044012799859046936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.41738238334655764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.5938879966735839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.8339455604553223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,1,power_law_1.2,1.4632960319519044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,1,power_law_1.2,1.5282112121582032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,1,power_law_1.2,1.6279232025146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,1,power_law_1.2,1.7031167984008788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,1,power_law_1.2,1.725823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,1,power_law_1.2,1.7694719314575196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,1,power_law_1.2,1.7940288543701173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,1,power_law_1.2,1.7993728637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,1,power_law_1.2,1.8329599380493165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,1,power_law_1.2,1.8935808181762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,1,power_law_1.2,1.9406848907470704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,1,power_law_1.2,1.981439971923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,1,power_law_1.2,2.0989952087402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,1,power_law_1.2,2.2544384002685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,32,power_law_1.2,3.021824073791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,1,power_law_1.2,2.5667583465576174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,1,power_law_1.2,2.8389375686645506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,1,power_law_1.2,3.546521759033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,1,power_law_1.2,4.040089416503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,1,power_law_1.2,5.440102386474609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,1,power_law_1.2,6.709452819824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,1,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,1,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,1,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,1,balanced,0.2326186696688334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,1,balanced,0.45073068141937256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,1,balanced,0.4546560049057007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,1,balanced,0.4575573205947876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,1,balanced,0.45960533618927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,1,balanced,0.4628479878107707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,1,balanced,0.48571733633677167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,1,balanced,0.4676266511281331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,1,balanced,0.47547733783721924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,1,balanced,0.4795733292897542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,1,balanced,0.4858880043029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,1,balanced,0.5097813208897909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,1,balanced,0.5171200037002563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,1,balanced,0.5367466608683268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,1,balanced,0.5562026500701904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,1,balanced,0.6135466496149699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,1,balanced,0.706559975941976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,1,balanced,0.8314879735310873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,1,balanced,1.1091626485188801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,1,balanced,1.3383679389953613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,1,balanced,1.8307414054870605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,1,balanced,2.360661347707113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,1,balanced,3.564373334248861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,1,balanced,4.728661219278972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,1,power_law_1.2,9.638092803955079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,16,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,16,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,16,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,16,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,16,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,16,balanced,0.28177066644032794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,16,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,16,balanced,0.28484266996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,16,balanced,0.28757333755493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,16,balanced,0.2872320016225179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,16,balanced,0.2887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,16,balanced,0.28996266921361286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,16,balanced,0.302565336227417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,16,balanced,0.30037333567937213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,16,balanced,0.30532266696294147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,16,balanced,0.30617600679397583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,16,balanced,0.3145386576652527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,16,balanced,0.3351893424987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,16,balanced,0.3524266481399536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,16,balanced,0.38229334354400635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,16,balanced,0.4177866776784261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,16,balanced,0.47018667062123615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,16,balanced,0.5841919978459676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,16,balanced,0.8029867013295492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,16,balanced,1.009493350982666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,16,balanced,1.4371840159098308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,16,balanced,1.8715200424194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,1,power_law_1.2,12.516966247558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,2,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,2,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,2,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,2,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,2,balanced,0.24285866816838583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,2,balanced,0.24524799982706705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,2,balanced,0.24661332368850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,2,balanced,0.2481493353843689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,2,balanced,0.24934399127960205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,2,balanced,0.2510506709416707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,2,balanced,0.24593067169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,2,balanced,0.2491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,2,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,2,balanced,0.2578773299853007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,2,balanced,0.26365866263707477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,2,balanced,0.26845866441726685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,2,balanced,0.2851840058962504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,2,balanced,0.30498133103052777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,2,balanced,0.3141973416010539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,2,balanced,0.35601067543029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,2,balanced,0.3964586655298869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,2,balanced,0.48605867226918537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,2,balanced,0.6078826586405436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,2,balanced,0.8934400081634521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,2,balanced,1.1665066878000896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,2,balanced,1.715712070465088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,2,balanced,2.2275412877400718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,1,balanced,0.5695146719614664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,1,balanced,1.0361173152923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,1,balanced,2.017279942830404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,1,balanced,2.11080535252889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,1,balanced,2.067626635233561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,1,balanced,2.0522665977478027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,1,balanced,2.0657493273417153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,1,balanced,2.0776960055033364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,1,balanced,2.0850346883138022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,1,balanced,2.0968052546183267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,1,balanced,2.12172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,1,balanced,2.152618726094564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.33177599906921384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,1,balanced,2.182485262552897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.5873663902282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,1,balanced,2.3208959897359214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,1,power_law_1.2,1.0565631866455079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,1,balanced,2.3517866134643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,1,power_law_1.2,1.702707290649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,1,balanced,2.3895039558410645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,1,balanced,2.500607967376709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,1,power_law_1.2,2.27061767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,1,balanced,3.4391040802001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,1,power_law_1.2,4.151705551147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,1,balanced,3.667114575703939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,1,balanced,4.641450564066569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,1,power_law_1.2,4.486553573608399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,1,balanced,5.386240005493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,1,power_law_1.2,4.785356903076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,1,power_law_1.2,4.803174209594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,1,balanced,7.128063837687175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,1,power_law_1.2,4.98155517578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,1,balanced,8.947882970174154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,1,power_law_1.2,5.248806381225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,1,power_law_1.2,5.384396743774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,1,balanced,12.582740783691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,1,power_law_1.2,5.337907028198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,1,power_law_1.2,5.443379211425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,1,balanced,17.248767852783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,1,power_law_1.2,5.670297622680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,1,power_law_1.2,5.780889511108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,1,power_law_1.2,5.960294342041015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,1,balanced,25.179306030273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,1,power_law_1.2,6.253772735595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,1,power_law_1.2,6.5943550109863285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,1,power_law_1.2,7.0252540588378904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,1,balanced,33.06512959798177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,1,power_law_1.2,7.553228759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,1,power_law_1.2,9.210470581054688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,1,power_law_1.2,9.79046401977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,1,power_law_1.2,12.603187561035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,2,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,2,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,2,balanced,0.05357866485913595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,2,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,2,balanced,0.0766293356815974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,2,balanced,0.2913279930750529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,2,balanced,0.411135991414388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,2,balanced,0.4227413336435954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,2,balanced,0.4288853406906128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,2,balanced,0.43263999621073407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,2,balanced,0.43161598841349286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,2,balanced,0.44407467047373456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,2,balanced,0.45174400011698407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,2,balanced,0.4667733510335286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,2,balanced,0.4819626808166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,2,balanced,0.49937065442403156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,2,balanced,0.5319413344065348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,2,balanced,0.6092480023701986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,1,power_law_1.2,15.411814880371093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,2,balanced,0.6703786849975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,2,balanced,0.8516266345977783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,2,balanced,1.051477352778117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,2,balanced,1.4402559598286946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,2,balanced,1.8310826619466145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,2,balanced,2.6308266321818032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,2,balanced,3.4761387507120767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,2,balanced,5.196799914042155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,2,balanced,6.929066975911458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,1,power_law_1.2,21.35552062988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,4,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,4,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,4,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,4,balanced,0.19490132729212442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,4,balanced,0.36522666613260907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,4,balanced,0.4869120121002197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,4,balanced,0.4889599879582723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,4,balanced,0.4870826800664266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,4,balanced,0.48930132389068604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,4,balanced,0.4899839957555135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,4,balanced,0.49237334728240967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,4,balanced,0.49561599890391034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,4,balanced,0.49766401449839276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,4,balanced,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,4,balanced,0.5092693169911703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,4,balanced,0.5118293364842733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,4,balanced,0.5193386475245158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,4,balanced,0.5200213193893433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,4,balanced,0.5346986850102743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,4,balanced,0.5620053211847941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,4,balanced,0.5894826650619507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,4,balanced,0.6584320068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,4,balanced,0.7301119963328043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,4,balanced,0.9149440129597982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,4,balanced,1.1098453203837078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,4,balanced,1.6034132639567058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,4,balanced,1.9568640391031902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,1,power_law_1.2,27.026431274414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,2,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,2,power_law_1.01,0.16752640008926392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,2,power_law_1.01,0.26869759559631345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,2,power_law_1.01,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,2,power_law_1.01,0.44810237884521487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,2,power_law_1.01,0.7415808200836181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,2,power_law_1.01,0.7573503971099853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,2,power_law_1.01,0.841318416595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,2,power_law_1.01,0.8656895637512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,2,power_law_1.01,0.8470527648925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,2,power_law_1.01,0.8337408065795898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,2,power_law_1.01,0.881868839263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,2,power_law_1.01,0.9058112144470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,2,power_law_1.01,0.9367551803588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,2,power_law_1.01,0.9480192184448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,2,power_law_1.01,0.9209856033325196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,2,power_law_1.01,0.9920512199401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,2,power_law_1.01,1.0313728332519532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,2,power_law_1.01,1.070899200439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,2,power_law_1.01,1.2146688461303712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,2,power_law_1.01,1.3080575942993165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,2,power_law_1.01,1.5534079551696778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,2,power_law_1.01,1.8079744338989259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,2,power_law_1.01,2.429132843017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,2,power_law_1.01,2.6071039199829102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,2,power_law_1.01,3.580518341064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,2,power_law_1.01,4.601235198974609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,8,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,8,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,8,balanced,0.04214933514595032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,8,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,8,balanced,0.04435733457406362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,8,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,8,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,8,balanced,0.05068266888459524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,8,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,8,balanced,0.05750399827957153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,8,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,8,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,8,balanced,0.07458133498827617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,8,balanced,0.07560533285140991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,8,balanced,0.08891733487447102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,8,balanced,0.1155413289864858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,8,balanced,0.13226667046546936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,8,balanced,0.233130673567454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,8,balanced,0.26947200298309326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,8,balanced,0.41574398676554364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,8,balanced,0.5251413186391195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,8,balanced,0.8210773468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,8,balanced,1.0968746344248455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,8,balanced,1.6235520044962566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,8,balanced,2.163029352823893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,8,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,8,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,8,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,8,power_law_1.01,0.04094719886779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,8,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,8,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,8,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,8,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,8,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,8,power_law_1.01,0.09768959879875183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,8,power_law_1.01,0.12410880327224731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,8,power_law_1.01,0.14254080057144164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,8,power_law_1.01,0.16977280378341675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,8,power_law_1.01,0.16997120380401612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,8,power_law_1.01,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,8,power_law_1.01,0.2553855895996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,8,power_law_1.01,0.42639360427856443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,8,power_law_1.01,0.4966400146484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,8,power_law_1.01,0.7395328044891357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,8,power_law_1.01,0.9926464080810546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,8,power_law_1.01,1.4532608032226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,8,power_law_1.01,1.7113088607788085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,4,power_law_1.01,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,4,power_law_1.01,0.4777984142303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,4,power_law_1.01,0.4230912208557129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,4,power_law_1.01,0.530022382736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,4,power_law_1.01,0.5279744148254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,4,power_law_1.01,0.5349376201629639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,4,power_law_1.01,0.5406720161437988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,4,power_law_1.01,0.6746111869812011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,8,power_law_1.01,2.6656639099121096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,4,power_law_1.01,0.6656000137329101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,4,power_law_1.01,0.7129087924957276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,4,power_law_1.01,0.705734395980835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,4,power_law_1.01,0.7956480026245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,4,power_law_1.01,0.8048640251159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,4,power_law_1.01,0.9474047660827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,4,power_law_1.01,1.065779209136963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,4,power_law_1.01,1.1071488380432128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,4,power_law_1.01,1.274873638153076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,4,power_law_1.01,1.7014783859252929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,4,power_law_1.01,1.8567167282104493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,4,power_law_1.01,2.2849536895751954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,8,power_law_1.01,3.8971393585205076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,4,power_law_1.01,2.751897621154785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,4,power_law_1.01,3.7785598754882814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,4,power_law_1.01,4.268236923217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,8,power_law_1.01,5.647155380249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,1,balanced,0.1996799906094869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,1,balanced,0.35276798407236737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,1,balanced,0.6719146569569906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,1,balanced,1.3056000073750813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,1,balanced,2.612053394317627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,32,power_law_1.01,0.6248447895050049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,1,balanced,5.084159851074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,32,power_law_1.01,0.8241151809692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,32,power_law_1.01,0.8212479591369629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,1,balanced,5.103957176208496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,32,power_law_1.01,0.8210432052612304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,32,power_law_1.01,0.8237055778503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,1,balanced,5.120170593261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,32,power_law_1.01,0.7333888053894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,1,balanced,5.137749354044597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,32,power_law_1.01,0.7684095859527588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,32,power_law_1.01,0.7251967906951904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,1,balanced,5.151914596557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,32,power_law_1.01,0.746291208267212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,32,power_law_1.01,0.7700479984283447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,1,balanced,5.180245399475098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,32,power_law_1.01,0.8013824462890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,8,power_law_1.01,6.5773567199707035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,32,power_law_1.01,0.7481344223022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,1,balanced,5.204991976420085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,32,power_law_1.01,0.7604224205017089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,32,power_law_1.01,0.7276544094085693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,1,balanced,5.229909261067708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,32,power_law_1.01,0.7614463806152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,32,power_law_1.01,0.76943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,32,power_law_1.01,0.7962624073028565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,1,balanced,5.273941357930501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,32,power_law_1.01,0.8515583992004394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,32,power_law_1.01,0.9297920227050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,1,balanced,5.311477343241374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,32,power_law_1.01,1.0160063743591308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,32,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,1,balanced,5.3524424235026045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,32,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,4,power_law_1.01,6.285516738891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,32,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,32,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,1,balanced,5.426005045572917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,32,power_law_1.01,1.0883071899414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,1,balanced,5.554858525594075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,32,power_law_1.01,1.4028800010681153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,32,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,32,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,32,power_law_1.01,1.5841279983520509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,32,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,1,balanced,5.692757288614909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,32,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,32,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,32,power_law_1.01,2.1348352432250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,32,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,32,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,1,balanced,5.954048156738281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,32,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,32,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,32,power_law_1.01,2.7367359161376954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,32,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,32,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,1,balanced,6.228138605753581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,32,power_law_1.01,0.045664000511169436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,32,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,32,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,32,power_law_1.01,3.9880702972412108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,32,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,32,power_law_1.01,0.07802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,32,power_law_1.01,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,1,balanced,6.977024078369141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,32,power_law_1.01,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,32,power_law_1.01,0.20480000972747803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,32,power_law_1.01,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,32,power_law_1.01,5.148467254638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,1,balanced,7.445333480834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,32,power_law_1.01,0.42229762077331545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,32,power_law_1.01,0.6854656219482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,32,power_law_1.01,0.9070591926574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,1,balanced,7.784789403279622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,1,balanced,8.831317265828451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,1,balanced,11.208021799723307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,1,balanced,14.03989283243815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,4,power_law_1.01,9.073868560791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,4,power_law_1.01,12.106739044189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,1,power_law_1.01,0.5851136207580566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,1,power_law_1.01,1.0438336372375487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,1,power_law_1.01,2.0105215072631837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,1,power_law_1.01,3.9786495208740233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,1,power_law_1.01,6.164684677124024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,1,power_law_1.01,7.947468566894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,1,power_law_1.01,11.642880249023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,1,power_law_1.01,11.806310272216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,1,power_law_1.01,12.293325042724609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,1,power_law_1.01,12.581068420410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,1,power_law_1.01,1.1284480094909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,1,power_law_1.01,2.196268844604492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,1,power_law_1.01,4.340518569946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,1,power_law_1.01,13.11658172607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,1,power_law_1.01,7.103282928466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,1,power_law_1.01,13.425050354003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,1,power_law_1.01,9.823846435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,1,power_law_1.01,13.569229125976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,1,power_law_1.01,16.80015411376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,1,power_law_1.01,13.732453918457031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,1,power_law_1.01,17.637376403808595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,1,power_law_1.01,14.597734069824218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,1,power_law_1.01,17.979391479492186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,1,power_law_1.01,14.491853332519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,4,power_law_1.01,14.25305633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,1,power_law_1.01,15.02472381591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,1,power_law_1.01,18.470501708984376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,1,power_law_1.01,15.412403869628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,1,power_law_1.01,19.038616943359376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,1,power_law_1.01,16.616242980957033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,1,power_law_1.01,19.542425537109374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,1,power_law_1.01,17.294297790527345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,1,power_law_1.01,19.839385986328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,1,power_law_1.01,18.881741333007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,1,power_law_1.01,20.026573181152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,1,power_law_1.01,21.417971801757812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,32,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,32,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,32,power_law_1.01,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,32,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,32,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,32,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,32,power_law_1.01,0.03788160085678101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,32,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,32,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,32,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,1,power_law_1.01,21.65391387939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,32,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,32,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,32,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,32,power_law_1.01,0.046060800552368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,32,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,32,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,32,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,1,power_law_1.01,21.623808288574217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,32,power_law_1.01,0.09195520281791687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,32,power_law_1.01,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,32,power_law_1.01,0.15134719610214234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,32,power_law_1.01,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,32,power_law_1.01,0.37560319900512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,32,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,32,power_law_1.01,0.7618559837341309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,1,power_law_1.01,22.270771789550782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,32,power_law_1.01,1.0440704345703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,1,power_law_1.01,24.938291931152342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,1,power_law_1.01,22.960333251953124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,1,power_law_1.01,32.4284423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,1,power_law_1.01,22.92674560546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,1,power_law_1.01,24.1364990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,1,power_law_1.01,42.00837097167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,1,power_law_1.01,25.362841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,1,power_law_1.01,26.7399169921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,1,power_law_1.01,51.98602294921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,1,power_law_1.01,31.669656372070314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,1,power_law_1.01,36.737432861328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,1,power_law_1.01,34.29683227539063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,1,power_law_1.01,42.90007019042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,1,power_law_1.01,49.1767822265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,1,power_law_1.01,65.09424438476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,1,power_law_1.01,80.08683471679687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,8,balanced,0.30446932713190716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,8,balanced,0.2728959918022156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,8,balanced,0.2723840077718099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,8,balanced,0.2730666597684224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,8,balanced,0.27477333943049115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,8,balanced,0.2759679953257243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,8,balanced,0.2774933377901713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,8,balanced,0.2786986629168193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,8,balanced,0.28125866254170734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,8,balanced,0.2821120023727417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,8,balanced,0.2845013340314229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,8,balanced,0.3322880069414775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,8,balanced,0.3351893424987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,8,balanced,0.292522668838501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,8,balanced,0.33740798632303876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,8,balanced,0.3490133285522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,8,balanced,0.3717120091120402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,8,balanced,0.5181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,8,balanced,0.6311253309249878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,8,balanced,0.8110026518503824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,8,balanced,0.9408853054046631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,8,balanced,1.257813294728597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,8,balanced,1.5015254020690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,8,balanced,1.9761494000752766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,8,balanced,2.5180160204569497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,8,balanced,3.554133415222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,8,balanced,4.542293230692546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,4,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,4,power_law_1.2,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,4,power_law_1.2,0.30208001136779783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,4,power_law_1.2,0.44175357818603517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,4,power_law_1.2,0.5398528099060058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,4,power_law_1.2,0.6135744094848633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,4,power_law_1.2,0.9193471908569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,4,power_law_1.2,0.8781824111938477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,4,power_law_1.2,0.9009152412414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,4,power_law_1.2,0.8923135757446289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,4,power_law_1.2,0.9201663970947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,4,power_law_1.2,0.9005056381225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,4,power_law_1.2,0.9392127990722656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,4,power_law_1.2,0.971776008605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,4,power_law_1.2,1.0012672424316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,4,power_law_1.2,1.0584063529968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,4,power_law_1.2,1.1034624099731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,4,power_law_1.2,1.1812864303588868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,4,power_law_1.2,1.2922880172729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,4,power_law_1.2,1.4354304313659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,4,power_law_1.2,1.64270076751709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,4,power_law_1.2,1.9716096878051759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,4,power_law_1.2,2.4856576919555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,4,power_law_1.2,3.4971649169921877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,4,power_law_1.2,4.4746753692626955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,4,power_law_1.2,6.321152114868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,4,power_law_1.2,6.495231628417969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,2,power_law_1.2,0.3446784019470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,2,power_law_1.2,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,2,power_law_1.2,0.6862847805023193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,2,power_law_1.2,1.0008576393127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,2,power_law_1.2,1.3959168434143066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,2,power_law_1.2,2.1946367263793944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,2,power_law_1.2,2.327961540222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,2,power_law_1.2,2.3937023162841795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,2,power_law_1.2,2.4264703750610352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,2,power_law_1.2,2.547097587585449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,2,power_law_1.2,2.6753023147583006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,2,power_law_1.2,2.7123584747314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,2,power_law_1.2,2.6605567932128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,2,power_law_1.2,2.806374359130859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,2,power_law_1.2,2.8432384490966798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,2,power_law_1.2,2.881920051574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,4,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,4,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,4,power_law_1.2,0.036627200245857236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,4,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,2,power_law_1.2,2.975129508972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,4,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,4,power_law_1.2,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,4,power_law_1.2,0.04379520118236542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,4,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,2,power_law_1.2,3.1920127868652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,4,power_law_1.2,0.054662400484085084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,4,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,4,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,4,power_law_1.2,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,2,power_law_1.2,3.346636962890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,4,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,4,power_law_1.2,0.10115840435028076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,4,power_law_1.2,0.11612160205841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,2,power_law_1.2,3.637247848510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,2,power_law_1.2,3.964313507080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,4,power_law_1.2,0.1509376049041748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,2,power_law_1.2,4.856422424316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,4,power_law_1.2,0.17100800275802613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,16,power_law_1.2,0.31989760398864747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,4,power_law_1.2,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,16,power_law_1.2,0.5107711791992188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,16,power_law_1.2,0.4403200149536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,16,power_law_1.2,0.547430419921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,16,power_law_1.2,0.5609471797943115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,16,power_law_1.2,0.5007296085357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,16,power_law_1.2,0.43909120559692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,4,power_law_1.2,0.35059199333190916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,16,power_law_1.2,0.4941823959350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,2,power_law_1.2,5.395455932617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,16,power_law_1.2,0.46530561447143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,16,power_law_1.2,0.46735358238220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,16,power_law_1.2,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,16,power_law_1.2,0.47902722358703614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,4,power_law_1.2,0.5079040050506591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,16,power_law_1.2,0.528384017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,16,power_law_1.2,0.5113855838775635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,16,power_law_1.2,0.5089280128479003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,16,power_law_1.2,0.5840896129608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,16,power_law_1.2,0.588595199584961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,16,power_law_1.2,0.6111231803894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,2,power_law_1.2,7.394509124755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,16,power_law_1.2,0.6715392112731934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,16,power_law_1.2,0.7935999870300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,16,power_law_1.2,0.8943615913391113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,16,power_law_1.2,1.131110382080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,16,power_law_1.2,1.3524991989135742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,2,power_law_1.2,8.902861022949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,16,power_law_1.2,2.060083198547363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,16,power_law_1.2,2.6294271469116213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,4,power_law_1.2,0.596992015838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,16,power_law_1.2,3.955507278442383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,16,power_law_1.2,5.045043182373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,2,power_law_1.2,12.424601745605468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,4,power_law_1.2,1.0010623931884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,4,power_law_1.2,1.2519424438476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,2,power_law_1.2,16.001434326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,4,power_law_1.2,1.9222400665283204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,4,power_law_1.2,2.815385627746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,4,power_law_1.2,0.030502399802207945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,4,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,4,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,4,power_law_1.2,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,4,power_law_1.2,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,4,power_law_1.2,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,4,power_law_1.2,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,4,power_law_1.2,0.23367679119110107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,4,power_law_1.2,0.2396159887313843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,4,power_law_1.2,0.23306241035461425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,4,power_law_1.2,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,4,power_law_1.2,0.264192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,4,power_law_1.2,0.26869759559631345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,4,power_law_1.2,0.2631680011749268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,4,power_law_1.2,0.23490560054779053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,4,power_law_1.2,0.28199679851531984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,4,power_law_1.2,0.28917760848999025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,2,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,4,power_law_1.2,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,2,power_law_1.01,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,4,power_law_1.2,0.3190783977508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,2,power_law_1.01,0.03193599879741669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,2,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,4,power_law_1.2,0.3569664001464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,2,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,2,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,4,power_law_1.2,0.4034560203552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,2,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,2,power_law_1.01,0.041971200704574586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,4,power_law_1.2,0.4863999843597412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,2,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,2,power_law_1.01,0.048102399706840514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,2,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,2,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,2,power_law_1.01,0.07348480224609374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,4,power_law_1.2,0.586956787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,2,power_law_1.01,0.0843775987625122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,4,power_law_1.2,0.8566783905029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,2,power_law_1.01,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,2,power_law_1.01,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,2,power_law_1.01,0.15645439624786378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,2,power_law_1.01,0.2091007947921753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,4,power_law_1.2,1.1431936264038085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,2,power_law_1.01,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,2,power_law_1.01,0.35778560638427737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,2,power_law_1.01,0.4364287853240967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,4,power_law_1.2,1.5210495948791505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,2,power_law_1.01,0.6858751773834229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,4,power_law_1.2,2.1272512435913087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,2,power_law_1.01,0.8527872085571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,2,power_law_1.01,1.2056575775146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,4,power_law_1.2,3.9251968383789064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,2,power_law_1.01,1.8782207489013671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,32,power_law_1.2,0.05221760272979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,32,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,32,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,32,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,32,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,32,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,32,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,32,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,32,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,32,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,32,power_law_1.2,0.042387199401855466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,32,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,32,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,32,power_law_1.2,0.04873600006103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,32,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,32,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,32,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,4,power_law_1.2,5.680742263793945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,32,power_law_1.2,0.07923840284347534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,32,power_law_1.2,0.09441279768943786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,32,power_law_1.2,0.12328959703445434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,32,power_law_1.2,0.15421439409255983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,32,power_law_1.2,0.2695168018341064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,32,power_law_1.2,0.3469311952590942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,32,power_law_1.2,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,32,power_law_1.2,0.6651904106140136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,32,power_law_1.2,1.1216896057128907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,32,power_law_1.2,1.5185919761657716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,2,power_law_1.01,3.2288768768310545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,1,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,1,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,1,power_law_1.2,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,1,power_law_1.2,0.535539197921753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,2,power_law_1.01,3.504742431640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,1,power_law_1.2,0.8599488258361816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,1,power_law_1.2,1.1931648254394531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,1,power_law_1.2,1.4225407600402833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,1,power_law_1.2,1.9875839233398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,1,power_law_1.2,2.1122880935668946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,1,power_law_1.2,2.1393407821655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,1,power_law_1.2,2.30645751953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,1,power_law_1.2,2.3775232315063475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,1,power_law_1.2,2.450432014465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,1,power_law_1.2,2.514944076538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,1,power_law_1.2,2.656255912780762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,1,power_law_1.2,2.730188751220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,1,power_law_1.2,2.8858367919921877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,1,power_law_1.2,3.118079948425293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,1,power_law_1.2,3.380633544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,1,power_law_1.2,3.7558273315429687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,1,power_law_1.2,4.165427017211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,4,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,4,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,4,power_law_1.2,0.06880000233650208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,1,power_law_1.2,4.913356781005859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,4,power_law_1.2,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,4,power_law_1.2,0.18001919984817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,4,power_law_1.2,0.2541568040847778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,1,power_law_1.2,5.868544006347657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,4,power_law_1.2,0.2942975997924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,4,power_law_1.2,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,4,power_law_1.2,0.35921919345855713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,4,power_law_1.2,0.3168256044387817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,1,power_law_1.2,7.331839752197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,4,power_law_1.2,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,4,power_law_1.2,0.3680255889892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,4,power_law_1.2,0.36474881172180174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,4,power_law_1.2,0.3749887943267822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,4,power_law_1.2,0.3919872045516968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,4,power_law_1.2,0.41984000205993655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,1,power_law_1.2,8.985804748535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,4,power_law_1.2,0.4302847862243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,4,power_law_1.2,0.4802559852600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,4,power_law_1.2,0.5758975982666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,4,power_law_1.2,0.6811647891998291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,4,power_law_1.2,0.8648703575134278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,4,power_law_1.2,1.2949503898620605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,4,power_law_1.2,1.5417344093322753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,1,power_law_1.2,12.215705871582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,4,power_law_1.2,2.1839872360229493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,4,power_law_1.2,2.872319984436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,4,power_law_1.2,4.219084930419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,1,power_law_1.2,14.964735412597657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,4,power_law_1.2,5.869772720336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,128,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,128,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,128,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,128,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,128,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,128,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,128,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,128,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,128,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,128,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,128,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,128,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,128,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,128,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,128,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,128,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,128,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,128,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,128,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,128,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,128,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,128,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,128,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,128,balanced,0.06911999980608623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,128,balanced,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,128,balanced,0.2730666597684224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,128,balanced,0.3573760191599528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,16,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,16,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,16,power_law_1.01,0.02210559993982315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,16,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,16,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,16,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,16,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,16,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,16,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,16,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,16,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,16,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,16,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,16,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,16,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,16,power_law_1.01,0.06488959789276123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,16,power_law_1.01,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,16,power_law_1.01,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,16,power_law_1.01,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,16,power_law_1.01,0.1464319944381714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,16,power_law_1.01,0.16711679697036744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,16,power_law_1.01,0.33873920440673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,16,power_law_1.01,0.47737598419189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,16,power_law_1.01,0.6811647891998291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,16,power_law_1.01,1.0182656288146972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,8,power_law_1.01,0.580403184890747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,8,power_law_1.01,1.0358783721923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,8,power_law_1.01,1.3105152130126954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,8,power_law_1.01,1.4604031562805175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,8,power_law_1.01,1.6322559356689452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,8,power_law_1.01,1.5890432357788087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,8,power_law_1.01,1.8130624771118165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,8,power_law_1.01,1.5857664108276368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,8,power_law_1.01,1.7864704132080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,8,power_law_1.01,1.718886375427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,8,power_law_1.01,1.816166305541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,8,power_law_1.01,1.7287168502807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,8,power_law_1.01,1.757593536376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,8,power_law_1.01,1.8937856674194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,8,power_law_1.01,1.8354175567626954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,8,power_law_1.01,2.024819183349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,2,balanced,0.027114666998386383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,2,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,2,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,2,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,2,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,2,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,2,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,2,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,2,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,2,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,8,power_law_1.01,2.0346879959106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,2,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,2,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,2,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,2,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,2,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,2,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,2,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,2,balanced,0.09591466188430786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,2,balanced,0.0897706647713979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,2,balanced,0.15308800339698792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,2,balanced,0.16639999548594156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,2,balanced,0.2821120023727417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,2,balanced,0.3998560110727946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,2,balanced,0.6202026605606079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,2,balanced,0.8901973565419515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,2,balanced,1.3566293716430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,8,power_law_1.01,2.1114879608154298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,2,balanced,1.8227200508117676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,8,power_law_1.01,2.1815296173095704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,8,power_law_1.01,2.2554624557495115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,8,power_law_1.01,2.5198591232299803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,8,power_law_1.01,2.872115135192871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,8,power_law_1.01,3.5016704559326173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,8,power_law_1.01,4.436377716064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,8,power_law_1.01,5.27196159362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,8,power_law_1.01,7.631053161621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,8,power_law_1.01,9.990118408203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,4,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,4,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,4,balanced,0.10257066289583842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,4,balanced,0.3107840021451314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,4,balanced,0.38467200597127277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,4,balanced,0.38758401075998944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,4,balanced,0.3887786865234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,4,balanced,0.39099733034769696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,4,balanced,0.3940693140029907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,4,balanced,0.3993599812189738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,4,balanced,0.40584532419840497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,4,balanced,0.41096532344818115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,4,balanced,0.42291200160980225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,4,balanced,0.434005339940389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,4,balanced,0.4416853189468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,4,balanced,0.4602880080540975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,4,balanced,0.49800535043080646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,4,balanced,0.5254826545715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,4,balanced,0.5899946689605713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,4,balanced,0.6864213148752848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,4,balanced,0.9444693724314371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,4,balanced,1.1857813199361165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,4,balanced,1.711957295735677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,4,balanced,2.221567948659261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,4,balanced,3.2269652684529624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,4,balanced,4.244480133056641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,64,power_law_1.01,0.19005440473556517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,64,power_law_1.01,0.18984960317611693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,64,power_law_1.01,0.18903039693832396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,64,power_law_1.01,0.1892351984977722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,64,power_law_1.01,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,64,power_law_1.01,0.1461951971054077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,64,power_law_1.01,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,64,power_law_1.01,0.1937407970428467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,64,power_law_1.01,0.14991359710693358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,64,power_law_1.01,0.14970879554748534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,64,power_law_1.01,0.19353599548339845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,64,power_law_1.01,0.19394559860229493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,64,power_law_1.01,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,64,power_law_1.01,0.12714879512786864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,64,power_law_1.01,0.20336639881134033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,64,power_law_1.01,0.1669119954109192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,64,power_law_1.01,0.14950400590896606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,64,power_law_1.01,0.20869119167327882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,64,power_law_1.01,0.18391040563583375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,64,power_law_1.01,0.2617023944854736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,64,power_law_1.01,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,64,power_law_1.01,0.41246719360351564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,64,power_law_1.01,0.4947840213775635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,64,power_law_1.01,0.7301119804382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,64,power_law_1.01,0.849510383605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,64,power_law_1.01,1.2247039794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,64,power_law_1.01,1.8049024581909179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,2,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,2,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,2,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,2,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,2,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,2,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,2,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,2,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,2,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,2,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,2,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,2,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,2,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,2,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,2,balanced,0.08328533172607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,2,balanced,0.11127466956774394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,2,balanced,0.16964266697565714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,2,balanced,0.2135039965311686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,2,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,2,balanced,0.3295573393503825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,2,balanced,0.44441600640614826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,2,balanced,0.7212373415629069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,2,balanced,1.0221227010091145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,2,balanced,1.5982933044433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,2,balanced,2.1949440638224282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,2,balanced,3.336533228556315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,2,balanced,4.467370669047038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,32,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,32,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,32,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,32,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,32,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,32,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,32,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,32,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,32,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,32,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,32,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,32,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,32,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,32,power_law_1.01,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,32,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,32,power_law_1.01,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,32,power_law_1.01,0.1662976026535034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,32,power_law_1.01,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.9256704330444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,32,power_law_1.01,0.3645440101623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,32,power_law_1.01,0.5789696216583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,1,power_law_1.2,1.3774847984313965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,32,power_law_1.01,0.7516160011291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,1,power_law_1.2,1.880678367614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,32,power_law_1.01,1.1876288414001466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,1,power_law_1.2,2.9065216064453123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,32,power_law_1.01,1.7715200424194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,1,power_law_1.2,3.0062463760375975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,1,power_law_1.2,3.176646423339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,1,power_law_1.2,3.2415744781494142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,1,power_law_1.2,3.3921024322509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,1,power_law_1.2,3.5327999114990236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,1,power_law_1.2,3.562700653076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,1,power_law_1.2,3.7294078826904298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,1,power_law_1.2,3.974924850463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,1,power_law_1.2,4.060569763183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,1,power_law_1.2,4.260863876342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,1,power_law_1.2,4.502732849121093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,1,power_law_1.2,4.883046340942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,1,power_law_1.2,5.370060729980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,1,power_law_1.2,5.7622528076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,1,power_law_1.2,6.80263671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,1,power_law_1.2,7.964876556396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,1,power_law_1.2,10.412025451660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,1,power_law_1.2,12.476416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,1,power_law_1.2,17.282867431640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,1,power_law_1.2,20.412211608886718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,8,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,8,balanced,0.03685333331425985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,8,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,8,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,8,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,8,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,8,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,8,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,8,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,8,balanced,0.052560001611709595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,8,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,8,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,8,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,8,balanced,0.08379733562469482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,8,balanced,0.09830400347709656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,8,balanced,0.11571199695269267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,8,balanced,0.1378986636797587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,8,balanced,0.23125332593917847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,8,balanced,0.2867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,8,balanced,0.48452266057332355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,8,balanced,0.6678187052408854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,8,balanced,1.0376533667246501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,8,balanced,1.401685396830241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,64,balanced,0.036159999668598175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,64,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,64,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,64,balanced,0.033941333492596946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,64,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,64,balanced,0.0354720006386439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,64,balanced,0.03614933292071024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,64,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,64,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,64,balanced,0.036858665446440377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,64,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,64,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,64,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,64,balanced,0.04009599983692169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,64,balanced,0.04264000058174133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,64,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,64,balanced,0.04573333263397217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,64,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,64,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,64,balanced,0.06279466549555461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,64,balanced,0.0727040022611618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,64,balanced,0.08754133184750874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,64,balanced,0.105813334385554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,64,balanced,0.16025066375732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,64,balanced,0.18926932414372763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,64,balanced,0.36061867078145343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,64,balanced,0.4590933322906494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,4,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,4,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,4,balanced,0.05340800185998281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,4,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,4,balanced,0.08038400113582611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,4,balanced,0.1971199909845988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,4,balanced,0.19797333081563315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,4,balanced,0.20428800582885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,4,balanced,0.20718934138615927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,4,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,4,balanced,0.21179733673731485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,4,balanced,0.21555199225743613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,4,balanced,0.2182826598485311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,4,balanced,0.22630399465560913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,4,balanced,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,4,balanced,0.24166399240493774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,4,balanced,0.2583893338839213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,4,balanced,0.3037866751352946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,4,balanced,0.32870399951934814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,4,balanced,0.4118186632792155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,4,balanced,0.4792319933573405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,4,balanced,0.7277226448059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,4,balanced,0.9794399738311768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,4,balanced,1.5353172620137532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,4,balanced,2.024789333343506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,4,balanced,2.8957014083862305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,4,balanced,4.041045188903809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,8,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,8,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,8,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,8,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,8,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,8,power_law_1.01,0.05262079834938049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,8,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,8,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,8,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,8,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,8,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,8,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,8,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,8,power_law_1.01,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,8,power_law_1.01,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,8,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,8,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,8,power_law_1.01,0.09318400025367737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,8,power_law_1.01,0.15278079509735107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,8,power_law_1.01,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,8,power_law_1.01,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,8,power_law_1.01,0.48435201644897463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,8,power_law_1.01,0.6727680206298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,8,power_law_1.01,1.0434559822082519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,8,power_law_1.01,1.4948351860046387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,8,power_law_1.01,2.429132843017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,8,power_law_1.01,3.400908660888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,2,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,2,power_law_1.2,0.06674559712409973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,2,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,2,power_law_1.2,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,2,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,2,power_law_1.2,0.38399999141693114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,2,power_law_1.2,0.3811327934265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,2,power_law_1.2,0.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,2,power_law_1.2,0.55763840675354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,2,power_law_1.2,0.562995195388794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,2,power_law_1.2,0.669491195678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,2,power_law_1.2,0.6385663986206055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,2,power_law_1.2,0.6234111785888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,2,power_law_1.2,0.6878848075866699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,2,power_law_1.2,0.7325376033782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,2,power_law_1.2,0.7837696075439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,2,power_law_1.2,0.8534015655517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,2,power_law_1.2,0.973414421081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,2,power_law_1.2,1.1134976387023925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,2,power_law_1.2,1.4034943580627441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,2,power_law_1.2,1.6756736755371093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,2,power_law_1.2,2.1995519638061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,2,power_law_1.2,2.6589183807373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,2,power_law_1.2,3.6544254302978514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,2,power_law_1.2,4.7032318115234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,2,power_law_1.2,7.230873870849609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,2,power_law_1.2,9.25634536743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,32,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,32,power_law_1.2,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,32,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,32,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,32,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,32,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,32,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,32,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,32,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,32,power_law_1.2,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,32,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,32,power_law_1.2,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,32,power_law_1.2,0.07451519966125489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,32,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,32,power_law_1.2,0.08536319732666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,32,power_law_1.2,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,32,power_law_1.2,0.10977280139923096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,32,power_law_1.2,0.1574720025062561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,32,power_law_1.2,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,32,power_law_1.2,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,32,power_law_1.2,0.3092479944229126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,32,power_law_1.2,0.4603775978088379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,32,power_law_1.2,0.5611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,32,power_law_1.2,0.9672703742980957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,32,power_law_1.2,1.4073856353759766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,32,power_law_1.2,2.31014404296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,32,power_law_1.2,2.670796775817871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,32,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,32,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,32,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,32,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,32,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,32,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,32,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,32,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,32,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,32,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,32,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,32,power_law_1.2,0.024979199469089507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,32,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,32,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,32,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,32,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,32,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,32,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,32,power_law_1.01,0.027225598692893982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,32,power_law_1.01,0.02948479950428009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,32,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,32,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,32,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,32,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,32,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,32,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,32,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,32,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,32,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,32,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,32,power_law_1.01,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,32,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,32,power_law_1.2,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,32,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,32,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,32,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,32,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,32,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,32,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,32,power_law_1.01,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,32,power_law_1.01,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,32,power_law_1.01,0.11345920562744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,32,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,32,power_law_1.01,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,32,power_law_1.2,0.11960320472717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,32,power_law_1.01,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,32,power_law_1.01,0.6406144142150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,32,power_law_1.01,1.0680319786071777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,32,power_law_1.2,0.2332672119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,32,power_law_1.01,1.4409728050231934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,32,power_law_1.2,0.3043328046798706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,32,power_law_1.2,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,2,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,2,power_law_1.2,0.06655359864234925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,2,power_law_1.2,0.19496959447860718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,2,power_law_1.2,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,2,power_law_1.2,0.35000319480895997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,2,power_law_1.2,0.582041597366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,2,power_law_1.2,0.6017024040222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,2,power_law_1.2,0.637337589263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,2,power_law_1.2,0.6582079887390136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,2,power_law_1.2,0.6660096168518066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,2,power_law_1.2,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,2,power_law_1.2,0.7061503887176513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,2,power_law_1.2,0.7192575931549072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,2,power_law_1.2,0.7469056129455567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,2,power_law_1.2,0.7970816135406494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,2,power_law_1.2,0.8118271827697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,2,power_law_1.2,0.8556544303894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,2,power_law_1.2,0.9510720252990723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,2,power_law_1.2,1.0250240325927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,2,power_law_1.2,1.2214271545410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,2,power_law_1.2,1.4186495780944823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,2,power_law_1.2,1.8905088424682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,2,power_law_1.2,2.217977523803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,2,power_law_1.2,2.8884992599487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,2,power_law_1.2,4.144128036499024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,32,power_law_1.2,0.6952960014343261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,2,power_law_1.2,5.636505508422852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,2,power_law_1.2,7.2876029968261715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,2,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,2,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,2,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,2,power_law_1.01,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,2,power_law_1.01,0.13189120292663575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,2,power_law_1.01,0.22753279209136962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,2,power_law_1.01,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,2,power_law_1.01,0.30084478855133057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,2,power_law_1.01,0.2996223926544189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,2,power_law_1.01,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,2,power_law_1.01,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,2,power_law_1.01,0.3217407941818237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,2,power_law_1.01,0.3397631883621216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,2,power_law_1.01,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,2,power_law_1.01,0.35450880527496337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,2,power_law_1.01,0.3690176010131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,2,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,2,power_law_1.01,0.4196352005004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,2,power_law_1.01,0.46100478172302245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,2,power_law_1.01,0.5347328186035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,2,power_law_1.01,0.6287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,2,power_law_1.01,0.8425472259521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,2,power_law_1.01,1.1454463958740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,2,power_law_1.01,1.620582389831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,2,power_law_1.01,2.0002815246582033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,2,power_law_1.01,3.1078399658203124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,2,power_law_1.01,4.068352127075196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,32,power_law_1.01,0.020883199572563172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,32,power_law_1.01,0.020070399343967437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,32,power_law_1.01,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,32,power_law_1.01,0.020275199413299562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,32,power_law_1.01,0.020479999482631683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,32,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,32,power_law_1.01,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,32,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,32,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,32,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,32,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,32,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,1,balanced,0.0336053321758906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,32,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,1,balanced,0.23347200949986777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,1,balanced,0.44544001420338947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,32,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,1,balanced,0.868181308110555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,32,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,32,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,1,balanced,1.707690715789795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,32,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,1,balanced,1.7160533269246419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,1,balanced,1.7211732864379883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,1,balanced,1.7283412615458171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,1,balanced,1.7366879781087239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,1,balanced,1.7418239911397297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,32,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,32,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,1,balanced,1.7532587051391602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,32,power_law_1.01,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,1,balanced,1.7749333381652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,32,power_law_1.01,0.08110079765319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,1,balanced,1.788416067759196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,32,power_law_1.01,0.10035200119018554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,32,power_law_1.01,0.14479360580444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,1,balanced,1.819818655649821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,32,power_law_1.01,0.22323200702667237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,1,balanced,1.882794698079427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,32,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,1,balanced,1.9030772844950359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,1,balanced,1.940992037455241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,1,balanced,1.9188052813212078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,1,balanced,2.0225706100463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,1,balanced,2.141866683959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,32,power_law_1.01,0.5861375808715821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,1,balanced,2.290005366007487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,1,balanced,2.5893227259318032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,1,balanced,2.846037228902181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,1,balanced,3.574101448059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,1,balanced,4.591242790222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,1,balanced,6.854656219482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,1,balanced,8.971434911092123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,8,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,8,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,8,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,8,power_law_1.2,0.09175040125846863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,8,power_law_1.2,0.11570559740066529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,8,power_law_1.2,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,8,power_law_1.2,0.1597440004348755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,8,power_law_1.2,0.12062720060348511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,8,power_law_1.2,0.1771456003189087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,8,power_law_1.2,0.159334397315979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,8,power_law_1.2,0.18534400463104247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,8,power_law_1.2,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,8,power_law_1.2,0.21646080017089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,8,power_law_1.2,0.2263040065765381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,8,power_law_1.2,0.23324799537658691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,8,power_law_1.2,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,8,power_law_1.2,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,8,power_law_1.2,0.2924544095993042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,8,power_law_1.2,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,8,power_law_1.2,0.4253695964813232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,8,power_law_1.2,0.4892672061920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,8,power_law_1.2,0.7006207942962647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,8,power_law_1.2,1.043660831451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,8,power_law_1.2,1.3348671913146972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,8,power_law_1.2,1.942732810974121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,8,power_law_1.2,2.9007871627807615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,8,power_law_1.2,0.3540992021560669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,8,power_law_1.2,0.6580160140991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,8,power_law_1.2,0.7192319869995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,8,power_law_1.2,0.8687616348266601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,8,power_law_1.2,1.0866687774658204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,8,power_law_1.2,0.8415231704711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,8,power_law_1.2,1.0518527984619142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,8,power_law_1.2,1.1423744201660155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,8,power_law_1.2,1.0395648002624511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,8,power_law_1.2,1.17391357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,8,power_law_1.2,1.1397120475769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,8,power_law_1.2,1.1488960266113282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,8,power_law_1.2,1.1356160163879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,8,power_law_1.2,1.265664005279541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,8,power_law_1.2,1.2183551788330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,8,power_law_1.2,1.242086410522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,8,power_law_1.2,1.3152064323425292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,8,power_law_1.2,1.3836288452148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,8,power_law_1.2,1.38154878616333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,8,power_law_1.2,1.509171199798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,8,power_law_1.2,1.841766357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,8,power_law_1.2,2.1981184005737306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,8,power_law_1.2,2.3160831451416017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,8,power_law_1.2,2.8899328231811525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,8,power_law_1.2,3.6876289367675783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,8,power_law_1.2,4.881407928466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,8,power_law_1.2,4.2323966979980465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,8,power_law_1.2,5.9490303039550785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,32,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,32,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,32,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,32,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,32,power_law_1.2,0.05262719988822937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,32,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,32,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,32,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,32,power_law_1.2,0.0542527973651886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,32,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,32,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,32,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,32,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,32,power_law_1.2,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,32,power_law_1.2,0.10792959928512573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,32,power_law_1.2,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,32,power_law_1.2,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,32,power_law_1.2,0.22118399143218995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,8,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,8,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,32,power_law_1.2,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,32,power_law_1.2,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,8,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,8,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,32,power_law_1.2,0.35635199546813967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,8,power_law_1.01,0.037676799297332766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,8,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,32,power_law_1.2,0.4798463821411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,32,power_law_1.2,0.6172671794891358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,32,power_law_1.2,0.9730048179626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,8,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,32,power_law_1.2,1.5370240211486816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,8,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,8,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,8,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,8,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,8,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,32,power_law_1.2,2.404351997375488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,8,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,8,power_law_1.01,0.05138559937477112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,8,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,8,power_law_1.01,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,8,power_law_1.01,0.08436480164527893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,8,power_law_1.01,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,32,power_law_1.2,3.3138687133789064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,8,power_law_1.01,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,8,power_law_1.01,0.32727038860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,8,power_law_1.01,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,8,power_law_1.01,0.6604800224304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,8,power_law_1.01,1.075814437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,8,power_law_1.01,1.6095232009887694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,8,power_law_1.01,2.428313636779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,8,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,8,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,8,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,8,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,8,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,8,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,8,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,8,power_law_1.2,0.042368000745773314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,8,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,8,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,8,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,8,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,8,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,8,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,8,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,8,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,8,power_law_1.2,0.09687039852142335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,8,power_law_1.2,0.12165119647979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,8,power_law_1.2,0.24391679763793944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,8,power_law_1.2,0.3278464078903198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,8,power_law_1.2,0.501964807510376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,8,power_law_1.2,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,8,power_law_1.2,1.1069439888000487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,8,power_law_1.2,1.6211967468261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,4,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,4,power_law_1.01,0.03808000087738037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,4,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,4,power_law_1.01,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,4,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,4,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,4,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,4,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,4,power_law_1.01,0.05630720257759094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,4,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,4,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,4,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,4,power_law_1.01,0.08212479948997498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,4,power_law_1.01,0.1265663981437683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,4,power_law_1.01,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,4,power_law_1.01,0.15011839866638182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,4,power_law_1.01,0.16524159908294678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,4,power_law_1.01,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,4,power_law_1.01,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,4,power_law_1.01,0.42945280075073244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,4,power_law_1.01,0.575270414352417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,4,power_law_1.01,0.8488960266113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,4,power_law_1.01,1.3412351608276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,8,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,8,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,8,power_law_1.2,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,8,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,8,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,8,power_law_1.2,0.18944000005722045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,8,power_law_1.2,0.16486400365829468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,8,power_law_1.2,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,8,power_law_1.2,0.15523840188980104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,8,power_law_1.2,0.14970879554748534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,8,power_law_1.2,0.17612799406051635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,8,power_law_1.2,0.1533951997756958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,8,power_law_1.2,0.19292160272598266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,8,power_law_1.2,0.19537919759750366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,8,power_law_1.2,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,8,power_law_1.2,0.20111360549926757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,8,power_law_1.2,0.21278719902038573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,8,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,8,power_law_1.2,0.28752639293670657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,8,power_law_1.2,0.3536895990371704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,8,power_law_1.2,0.40079360008239745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,8,power_law_1.2,0.7170048236846924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,8,power_law_1.2,0.9484288215637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,8,power_law_1.2,1.379532814025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,8,power_law_1.2,2.1555200576782227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,8,power_law_1.2,2.838323211669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,8,power_law_1.2,4.29854736328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,4,power_law_1.01,1.8868223190307618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,4,power_law_1.01,2.355404853820801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,1,balanced,1.0627413590749104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,1,balanced,2.085888067881266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,1,balanced,4.028554598490397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,1,balanced,8.002389272054037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,1,balanced,15.933099110921225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,1,balanced,31.799636840820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,1,balanced,47.71447245279948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,1,balanced,0.8159573078155518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,1,balanced,1.5631359418233235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,1,balanced,47.74229431152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,1,balanced,2.7972160975138345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,1,balanced,5.524991989135742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,1,balanced,10.82419204711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,1,balanced,15.969083150227865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,1,balanced,47.76701863606771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,1,balanced,16.03497060139974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,1,balanced,16.08635711669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,1,balanced,16.140628814697266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,1,balanced,47.79366556803385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,4,power_law_1.01,3.445964813232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,1,balanced,16.195584615071613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,1,balanced,16.29320017496745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,1,balanced,16.38314692179362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,16,power_law_1.01,0.39628798961639405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,1,balanced,47.87251281738281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,16,power_law_1.01,0.5586175918579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,16,power_law_1.01,0.5421055793762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,16,power_law_1.01,0.5556223869323731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,16,power_law_1.01,0.5140480041503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,1,balanced,16.47308858235677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,16,power_law_1.01,0.5554111957550049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,16,power_law_1.01,0.47411198616027833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,16,power_law_1.01,0.510969591140747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,16,power_law_1.01,0.5316544055938721
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,16,power_law_1.01,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,16,power_law_1.01,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,16,power_law_1.01,0.5404672145843505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,1,balanced,16.615765889485676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,16,power_law_1.01,0.5359615802764892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,16,power_law_1.01,0.5511168003082275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,16,power_law_1.01,0.5529600143432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,16,power_law_1.01,0.5777408123016358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,16,power_law_1.01,0.5744639873504639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,16,power_law_1.01,0.6113279819488525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,16,power_law_1.01,0.6647808074951171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,1,balanced,47.932413736979164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,1,balanced,16.767658233642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,16,power_law_1.01,0.7563263893127441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,16,power_law_1.01,0.871833610534668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,16,power_law_1.01,1.2101632118225099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,16,power_law_1.01,1.3033472061157227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,1,balanced,16.903509775797527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,16,power_law_1.01,1.8477056503295899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,16,power_law_1.01,2.322431945800781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,16,power_law_1.01,3.2677886962890623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,1,balanced,17.133055369059246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,16,power_law_1.01,4.472217559814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,1,balanced,47.98890686035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,1,balanced,17.570288340250652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,1,balanced,18.01898701985677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,1,balanced,19.573076883951824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,1,balanced,48.11076354980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,1,balanced,19.57256571451823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,4,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,4,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,4,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,4,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,4,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,4,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,4,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,4,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,4,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,4,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,4,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,4,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,4,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,4,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,4,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,4,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,4,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,4,balanced,0.09864532947540283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,1,balanced,48.22391255696615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,4,balanced,0.09215999643007915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,4,balanced,0.15820800264676413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,1,balanced,20.693504333496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,4,balanced,0.17322667439778647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,4,balanced,0.33433600266774494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,4,balanced,0.5024426778157552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,4,balanced,0.7255040009816488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,4,balanced,1.0142719745635986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,1,balanced,21.967702229817707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,1,balanced,48.31693013509115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,1,balanced,27.3068364461263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,4,power_law_1.01,4.7783935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,1,balanced,30.35443115234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,1,balanced,48.544087727864586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,1,balanced,42.1744639078776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,1,balanced,48.98133341471354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,1,balanced,54.90977986653646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,1,balanced,50.82931009928385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,1,balanced,51.718658447265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,8,power_law_1.01,0.5193727970123291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,1,balanced,53.030059814453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,8,power_law_1.01,0.5185535907745361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,8,power_law_1.01,0.5195775985717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,8,power_law_1.01,0.5206016063690185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,8,power_law_1.01,0.522649621963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,8,power_law_1.01,0.5349376201629639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,8,power_law_1.01,0.7405568122863769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,8,power_law_1.01,0.8175616264343262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,8,power_law_1.01,0.8966143608093262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,8,power_law_1.01,0.9660415649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,8,power_law_1.01,0.9160703659057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,8,power_law_1.01,1.0035200119018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,8,power_law_1.01,1.316864013671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,8,power_law_1.01,1.5544320106506349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,8,power_law_1.01,2.2851583480834963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,8,power_law_1.01,2.6630144119262695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,8,power_law_1.01,2.8233728408813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,1,balanced,54.62389119466146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,8,power_law_1.01,4.085145568847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,8,power_law_1.01,5.2234241485595705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,8,power_law_1.01,7.044505310058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,1,balanced,62.73245747884115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,8,power_law_1.01,8.155731201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,8,power_law_1.01,10.59509735107422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,8,power_law_1.01,13.241343688964843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,8,power_law_1.01,15.461170959472657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,1,balanced,107.85689290364583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,1,balanced,65.63720703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,8,power_law_1.01,21.866085815429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,1,balanced,75.0204569498698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,16,power_law_1.2,0.5955584049224854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,16,power_law_1.2,1.0213376045227052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,16,power_law_1.2,0.8824831962585449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,16,power_law_1.2,1.0174464225769042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,16,power_law_1.2,1.0299391746520996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,16,power_law_1.2,0.759603214263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,16,power_law_1.2,0.951091194152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,16,power_law_1.2,0.9318400382995605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,16,power_law_1.2,0.9588735580444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,16,power_law_1.2,1.0000384330749512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,16,power_law_1.2,0.991436767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,16,power_law_1.2,0.9844736099243164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,16,power_law_1.2,0.9662464141845704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,16,power_law_1.2,0.9844736099243164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,16,power_law_1.2,0.9828351974487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,16,power_law_1.2,1.033011245727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,16,power_law_1.2,1.0713088035583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,16,power_law_1.2,1.1722751617431642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,16,power_law_1.2,1.216921615600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,16,power_law_1.2,1.3834239959716796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,16,power_law_1.2,1.5703935623168945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,16,power_law_1.2,2.024038314819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,16,power_law_1.2,2.2378496170043944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,1,balanced,84.75392150878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,16,power_law_1.2,3.427532958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,16,power_law_1.2,4.595711898803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,16,power_law_1.2,6.676480102539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,16,power_law_1.2,7.34576644897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,32,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,32,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,32,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,32,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,32,power_law_1.2,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,32,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,32,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,32,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,32,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,32,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,32,power_law_1.2,0.0331712007522583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,32,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,32,power_law_1.2,0.0403328001499176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,32,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,32,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,32,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,32,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,32,power_law_1.2,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,32,power_law_1.2,0.09318400025367737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,32,power_law_1.2,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,8,power_law_1.01,27.943936157226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,32,power_law_1.2,0.23306241035461425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,32,power_law_1.2,0.35184640884399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,32,power_law_1.2,0.47226881980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,32,power_law_1.2,0.7458816051483155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,32,power_law_1.2,0.9363455772399902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,32,power_law_1.2,1.738547134399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,8,power_law_1.01,33.99966735839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,32,power_law_1.2,2.246860885620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,64,power_law_1.2,0.6008831977844238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,64,power_law_1.2,0.540876817703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,64,power_law_1.2,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,64,power_law_1.2,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,64,power_law_1.2,0.4419583797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,64,power_law_1.2,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,64,power_law_1.2,0.5238719940185547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,64,power_law_1.2,0.5525504112243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,64,power_law_1.2,0.5277696132659913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,64,power_law_1.2,0.530617618560791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,64,power_law_1.2,0.5599232196807862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,64,power_law_1.2,0.5464064121246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,64,power_law_1.2,0.49232001304626466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,64,power_law_1.2,0.5259263992309571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,64,power_law_1.2,0.6146048069000244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,64,power_law_1.2,0.6020864009857178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,64,power_law_1.2,0.6176767826080323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,64,power_law_1.2,0.7497727870941162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,64,power_law_1.2,0.8101887702941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,64,power_law_1.2,1.0070015907287597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,64,power_law_1.2,1.3180928230285645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,64,power_law_1.2,1.9990528106689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,64,power_law_1.2,2.489958381652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,64,power_law_1.2,3.463372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,64,power_law_1.2,4.612710571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,64,power_law_1.2,7.697203063964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,64,power_law_1.2,11.984678649902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,1,balanced,0.04641599953174591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,1,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,1,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,1,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,1,balanced,0.1508693297704061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,1,balanced,0.35259731610616046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,1,balanced,0.35549867153167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,1,balanced,0.36078933874766034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,1,balanced,0.36556800206502277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,1,balanced,0.37017067273457843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,1,balanced,0.3787093162536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,1,balanced,0.3858773310979207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,1,balanced,0.3930453459421794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,1,balanced,0.407039999961853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,1,balanced,0.4212053219477336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,1,balanced,0.43485867977142334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,1,balanced,0.45721598466237384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,1,balanced,0.5155839920043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,1,balanced,0.5857280095418295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,1,balanced,0.7581013043721517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,1,balanced,0.9453226725260416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,1,balanced,1.3276159763336182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,1,balanced,1.7020586331685383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,1,balanced,2.4808106422424316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,1,balanced,3.2989867528279624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,1,balanced,4.990805308024089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,1,balanced,6.660266876220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,16,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,16,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,16,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,16,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,16,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,16,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,16,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,16,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,16,power_law_1.01,0.024160000681877136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,16,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,16,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,16,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,16,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,16,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,16,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,16,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,16,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,16,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,16,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,16,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,16,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,16,power_law_1.01,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,16,power_law_1.01,0.11489280462265014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,16,power_law_1.01,0.2510848045349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,16,power_law_1.01,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,16,power_law_1.01,0.4497407913208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,16,power_law_1.01,0.6809599876403809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,16,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,16,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,16,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,16,balanced,0.042133331298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,16,balanced,0.0448586642742157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,16,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,16,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,16,balanced,0.047930667797724404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,16,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,16,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,16,balanced,0.04948266843954722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,16,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,16,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,16,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,16,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,16,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,16,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,16,balanced,0.07611733178297679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,16,balanced,0.09727999567985535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,16,balanced,0.21794132391611734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,16,balanced,0.2617759903271993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,16,balanced,0.3341653347015381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,16,balanced,0.40669866402943927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,16,balanced,0.6048426628112793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,16,balanced,0.8313173453013102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,16,balanced,1.246549367904663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,16,balanced,1.6537599563598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,8,power_law_1.2,0.6273024082183838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,8,power_law_1.2,0.7829504013061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,8,power_law_1.2,0.9400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,8,power_law_1.2,0.963584041595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,8,power_law_1.2,1.0530816078186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,8,power_law_1.2,1.2480511665344238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,8,power_law_1.2,1.1980799674987792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,8,power_law_1.2,1.3496319770812988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,8,power_law_1.2,1.32423677444458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,8,power_law_1.2,1.2617728233337402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,8,power_law_1.2,1.3090815544128418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,8,power_law_1.2,1.4161727905273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,8,power_law_1.2,1.3840383529663085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,8,power_law_1.2,1.431340789794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,8,power_law_1.2,1.4960639953613282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,8,power_law_1.2,1.507737636566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,8,power_law_1.2,1.4845952033996581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,8,power_law_1.2,1.6128000259399413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,8,power_law_1.2,1.7758207321166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,8,power_law_1.2,1.9787776947021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,8,power_law_1.2,2.452479934692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,8,power_law_1.2,3.3896446228027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,8,power_law_1.2,3.3282047271728517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,8,power_law_1.2,4.384153747558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,8,power_law_1.2,5.459148788452149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,8,power_law_1.2,10.194329833984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,8,power_law_1.2,9.847193908691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,4,power_law_1.2,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,4,power_law_1.2,0.5298175811767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,4,power_law_1.2,0.47411198616027833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,4,power_law_1.2,0.5298175811767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,4,power_law_1.2,0.5273536205291748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,4,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,4,power_law_1.2,0.5429247856140137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,4,power_law_1.2,0.6033408164978027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,4,power_law_1.2,0.6914048194885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,4,power_law_1.2,0.7497727870941162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,4,power_law_1.2,0.662937593460083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,4,power_law_1.2,0.7368703842163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,4,power_law_1.2,0.7903232097625732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,4,power_law_1.2,1.0149888038635253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,4,power_law_1.2,1.0393600463867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,4,power_law_1.2,1.1714559555053712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,4,power_law_1.2,1.3408255577087402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,4,power_law_1.2,1.7074176788330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,4,power_law_1.2,1.8384895324707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,4,power_law_1.2,2.245625686645508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,4,power_law_1.2,2.854502487182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,4,power_law_1.2,3.8424510955810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,4,power_law_1.2,4.757503890991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,16,power_law_1.2,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,16,power_law_1.2,0.13537280559539794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,16,power_law_1.2,0.2095103979110718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,16,power_law_1.2,0.25128960609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,16,power_law_1.2,0.1994752049446106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,16,power_law_1.2,0.19578880071640015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,16,power_law_1.2,0.2396159887313843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,16,power_law_1.2,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,16,power_law_1.2,0.23900160789489747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,16,power_law_1.2,0.22650880813598634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,16,power_law_1.2,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,16,power_law_1.2,0.2545664072036743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,16,power_law_1.2,0.24842240810394287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,16,power_law_1.2,0.2508543968200684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,16,power_law_1.2,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,16,power_law_1.2,0.2539391994476318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,16,power_law_1.2,0.2695168018341064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,16,power_law_1.2,0.27013120651245115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,16,power_law_1.2,0.2940608024597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,16,power_law_1.2,0.35061120986938477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,16,power_law_1.2,0.39403519630432127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,16,power_law_1.2,0.5591040134429932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,16,power_law_1.2,0.6146048069000244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,16,power_law_1.2,0.8409088134765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,16,power_law_1.2,1.2433407783508301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,16,power_law_1.2,1.8522111892700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,4,power_law_1.2,6.363545608520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,16,power_law_1.2,2.4922111511230467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,2,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,2,balanced,0.21589332818984985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,2,balanced,0.4331520001093547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,2,balanced,0.766266663869222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,2,balanced,1.4385493596394856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,2,balanced,2.08298667271932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,2,balanced,2.0927146275838218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,2,balanced,2.103125254313151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,2,balanced,2.118293285369873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,2,balanced,2.128554662068685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,2,balanced,2.1481812795003257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,2,balanced,2.171903928120931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,2,balanced,2.1925546328226724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,2,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,2,balanced,2.23691733678182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,2,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,2,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,2,balanced,0.07645866771539052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,2,balanced,0.2792106668154399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,2,balanced,0.53111465771993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,2,balanced,2.2809599240620932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,2,balanced,0.7787520090738932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,2,balanced,0.7828479607899984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,2,balanced,2.324138641357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,2,balanced,0.7871146996816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,2,balanced,0.7934292952219645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,2,balanced,0.8023040294647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,2,balanced,2.4019625981648765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,2,balanced,0.8137386639912924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,2,balanced,0.8241493701934814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,2,balanced,2.532693386077881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,2,balanced,0.8463359673817953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,2,balanced,0.8652799924214681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,2,balanced,0.8835306962331136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,2,balanced,2.662058671315511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,2,balanced,0.932522694269816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,2,balanced,1.0195626417795818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,2,balanced,2.956629435221354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,2,balanced,1.1625813643137615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,2,balanced,1.3738667170206706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,2,balanced,3.2701441446940103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,2,balanced,1.6131253242492676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,2,balanced,2.14630397160848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,2,balanced,3.896474520365397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,2,balanced,2.6289493242899575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,2,balanced,4.659712155659993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,2,balanced,3.650730768839518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,2,balanced,4.572330792744954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,2,balanced,6.295210520426433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,2,balanced,6.58244260152181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,2,balanced,7.671125411987305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,2,balanced,8.495786666870117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,2,balanced,10.892288208007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,2,balanced,14.126932779947916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,4,power_law_1.2,8.348876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,4,power_law_1.2,11.898675537109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,2,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,2,balanced,0.0766186664501826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,2,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,2,balanced,0.5319679975509644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,2,balanced,1.0373120307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,2,balanced,2.0348587036132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,2,balanced,2.043733278910319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,2,balanced,2.050901254018148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,2,balanced,2.060800075531006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,2,balanced,2.0653813680013022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,2,balanced,2.0802559852600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,2,balanced,2.0964694023132324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,2,balanced,2.111146608988444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,2,balanced,2.1415252685546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,2,balanced,2.1661012967427573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,2,balanced,2.190336068471273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,2,balanced,2.2493866284688315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,2,balanced,2.3905280431111655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,2,balanced,2.495317300160726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,2,balanced,2.708650588989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,2,balanced,2.9690879185994468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,2,balanced,3.3887573877970376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,2,balanced,3.908778508504232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,2,balanced,5.107370694478353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,2,balanced,5.965141296386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,2,balanced,8.30395762125651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,2,balanced,10.16695467631022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,4,power_law_1.2,15.348326110839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,2,balanced,0.39099733034769696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,4,balanced,0.07048533360163371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,2,balanced,0.762880007425944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,4,balanced,0.27818665901819867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,4,balanced,0.53111465771993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,2,balanced,1.448618729909261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,4,balanced,1.037823994954427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,4,balanced,2.070869286855062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,2,balanced,2.907125473022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,4,balanced,4.020223935445149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,2,balanced,5.587455749511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,4,balanced,5.972650527954102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,2,balanced,8.01040013631185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,4,balanced,6.01634152730306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,2,balanced,8.040096282958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,4,balanced,6.024192174275716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,2,balanced,8.06929079691569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,4,balanced,6.021973292032878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,2,balanced,8.096426645914713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,4,balanced,6.048074722290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,2,balanced,8.122709274291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,4,balanced,6.056608200073242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,4,balanced,6.074709574381511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,2,balanced,8.166229248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,4,balanced,6.061738967895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,2,balanced,8.213674545288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,4,balanced,6.083413441975911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,2,balanced,8.255488077799479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,4,balanced,6.110720316569011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,4,balanced,6.152704238891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,2,balanced,8.33518918355306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,4,balanced,6.257322947184245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,2,balanced,8.405824025472006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,4,balanced,6.514346440633138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,8,power_law_1.2,0.19394559860229493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,2,balanced,8.472405115763346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,8,power_law_1.2,0.34754559993743894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,4,balanced,6.684672037760417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,8,power_law_1.2,0.346726393699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,8,power_law_1.2,0.5083136081695556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,8,power_law_1.2,0.5337088108062744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,2,balanced,8.589141209920248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,4,balanced,6.811306635538737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,8,power_law_1.2,0.5240831851959229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,8,power_law_1.2,0.561356782913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,8,power_law_1.2,0.5619711875915527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,4,balanced,7.121226628621419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,8,power_law_1.2,0.6045695781707764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,128,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,2,balanced,8.81544558207194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,128,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,8,power_law_1.2,0.6000639915466308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,128,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,128,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,8,power_law_1.2,0.6023168087005615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,128,power_law_1.2,0.024774399399757386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,8,power_law_1.2,0.6064127922058106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,128,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,128,power_law_1.2,0.02558720111846924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,4,balanced,8.698026657104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,8,power_law_1.2,0.6113279819488525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,128,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,2,balanced,9.036799748738607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,128,power_law_1.2,0.025561600923538208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,8,power_law_1.2,0.6197247982025147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,128,power_law_1.2,0.02597759962081909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,128,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,8,power_law_1.2,0.6393727779388427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,128,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,8,power_law_1.2,0.6311935901641845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,128,power_law_1.2,0.027423998713493346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,128,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,8,power_law_1.2,0.6715392112731934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,128,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,4,balanced,8.384170532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,128,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,8,power_law_1.2,0.7145472049713135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,128,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,2,balanced,9.772202809651693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,128,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,8,power_law_1.2,0.735641622543335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,128,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,128,power_law_1.2,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,8,power_law_1.2,0.8079360008239747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,8,power_law_1.2,0.9658368110656739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,4,balanced,8.447829564412435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,128,power_law_1.2,0.09584640264511109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,8,power_law_1.2,1.1149184226989746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,2,balanced,9.794389088948568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,8,power_law_1.2,1.3015040397644042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,128,power_law_1.2,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,8,power_law_1.2,1.6887807846069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,4,balanced,10.574335734049479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,128,power_law_1.2,0.19290879964828492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,8,power_law_1.2,2.166169548034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,2,balanced,10.431317647298178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,128,power_law_1.2,0.3239936113357544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,8,power_law_1.2,3.382271957397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,4,balanced,11.43176523844401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,2,balanced,11.065685272216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,8,power_law_1.2,3.805388641357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,2,balanced,13.77347183227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,2,balanced,15.638010660807291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,128,power_law_1.2,0.4827136039733887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,2,balanced,24.093526204427082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,2,balanced,27.004074096679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,2,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,2,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,2,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,2,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,2,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,16,power_law_1.01,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,2,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,2,power_law_1.01,0.03767040073871612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,16,power_law_1.01,0.5400576114654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,2,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,2,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,2,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,16,power_law_1.01,0.8081215858459473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,2,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,2,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,16,power_law_1.01,0.7913472175598144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,2,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,2,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,16,power_law_1.01,0.788479995727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,16,power_law_1.01,0.7241727828979492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,2,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,16,power_law_1.01,0.6883327960968018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,2,power_law_1.01,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,16,power_law_1.01,0.7393280029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,16,power_law_1.01,0.6821887969970704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,2,power_law_1.01,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,16,power_law_1.01,0.643071985244751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,16,power_law_1.01,0.6942719936370849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,16,power_law_1.01,0.6651904106140136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,2,power_law_1.01,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,16,power_law_1.01,0.667033576965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,16,power_law_1.01,0.7534592151641846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,2,power_law_1.01,0.1275904059410095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,16,power_law_1.01,0.7489535808563232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,16,power_law_1.01,0.7181951999664307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,128,power_law_1.2,0.7427840232849121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,2,power_law_1.01,0.17694720029830932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,16,power_law_1.01,0.8247296333312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,16,power_law_1.01,0.8214336395263672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,16,power_law_1.01,0.8407039642333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,2,power_law_1.01,0.2574336051940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,16,power_law_1.01,0.9162495613098145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,16,power_law_1.01,1.0534912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,16,power_law_1.01,1.1112192153930665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,16,power_law_1.01,1.3582271575927733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,16,power_law_1.01,1.8132991790771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,16,power_law_1.01,2.240716743469238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,16,power_law_1.01,3.4543617248535154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,2,power_law_1.01,0.39239680767059326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,16,power_law_1.01,3.7599231719970705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,2,power_law_1.01,0.4730879783630371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,2,power_law_1.01,0.8257408142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,2,power_law_1.01,1.1468799591064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,128,power_law_1.2,1.0192895889282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,2,power_law_1.01,2.022809600830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,2,power_law_1.01,2.614681625366211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,32,power_law_1.01,0.3225600004196167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,32,power_law_1.01,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,32,power_law_1.01,0.29122560024261473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,32,power_law_1.01,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,32,power_law_1.01,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,32,power_law_1.01,0.27504639625549315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,32,power_law_1.01,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,32,power_law_1.01,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,32,power_law_1.01,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,32,power_law_1.01,0.2824064016342163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,32,power_law_1.01,0.27504639625549315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,32,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,32,power_law_1.01,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,32,power_law_1.01,0.29122560024261473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,32,power_law_1.01,0.3082240104675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,32,power_law_1.01,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,32,power_law_1.01,0.3229696035385132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,32,power_law_1.01,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,32,power_law_1.01,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,32,power_law_1.01,0.41103358268737794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,32,power_law_1.01,0.47759361267089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,32,power_law_1.01,0.5965824127197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,32,power_law_1.01,0.745472002029419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,32,power_law_1.01,1.2701696395874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,32,power_law_1.01,1.4792703628540038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,32,power_law_1.01,2.071347236633301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,32,power_law_1.01,2.855936050415039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,8,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,8,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,8,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,8,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,8,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,8,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,8,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,8,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,8,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,8,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,8,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,8,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,8,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,8,power_law_1.2,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,8,power_law_1.2,0.09338880181312562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,8,power_law_1.2,0.13148159980773927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,8,power_law_1.2,0.22466559410095216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,8,power_law_1.2,0.2789376020431519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,8,power_law_1.2,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,8,power_law_1.2,0.5148672103881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,8,power_law_1.2,0.7583615779876709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,8,power_law_1.2,1.1980799674987792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,8,power_law_1.2,1.7657855987548827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,64,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,64,power_law_1.2,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,64,power_law_1.2,0.060192000865936277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,64,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,64,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,64,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,64,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,64,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,64,power_law_1.2,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,64,power_law_1.2,0.05486080050468445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,64,power_law_1.2,0.0585536003112793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,64,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,64,power_law_1.2,0.0692031979560852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,64,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,64,power_law_1.2,0.08663039803504943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,64,power_law_1.2,0.1060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,2,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,2,balanced,0.17117865880330405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,64,power_law_1.2,0.1347584009170532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,2,balanced,0.3689813216527303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,2,balanced,0.7434026400248209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,64,power_law_1.2,0.20703999996185302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,2,balanced,1.3702826499938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,64,power_law_1.2,0.2451456069946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,64,power_law_1.2,0.3022847890853882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,64,power_law_1.2,0.3852288007736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,64,power_law_1.2,0.5419007778167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,2,balanced,1.8629973729451497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,2,balanced,1.86845858891805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,64,power_law_1.2,0.6121471881866455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,2,balanced,1.8744319279988606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,2,balanced,1.8797225952148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,64,power_law_1.2,0.9043968200683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,2,balanced,1.8826239903767903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,2,balanced,1.8908054033915203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,2,balanced,1.8981547355651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,64,power_law_1.2,1.3385727882385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,2,balanced,1.9068586031595867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,2,balanced,1.9201706250508626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,2,balanced,1.9365545908610027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,2,balanced,1.9474773406982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,64,power_law_1.2,2.2566911697387697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,2,balanced,1.9694933891296387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,2,balanced,2.002602736155192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,2,balanced,2.041855971018473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,2,balanced,2.080570697784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,2,balanced,2.1550079981486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,64,power_law_1.2,3.212492752075195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,2,balanced,2.3191893895467124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,2,balanced,2.49617067972819
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,2,balanced,2.844501177469889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,2,balanced,3.230208079020182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,2,balanced,4.453717231750488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,2,balanced,5.43556276957194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,1,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,1,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,1,power_law_1.2,0.06777600049972535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,1,power_law_1.2,0.1419263958930969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,1,power_law_1.2,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,1,power_law_1.2,0.38645761013031005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,1,power_law_1.2,0.4050943851470947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,1,power_law_1.2,0.4157440185546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,1,power_law_1.2,0.4325376033782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,1,power_law_1.2,0.43868160247802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,1,power_law_1.2,0.45240321159362795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,1,power_law_1.2,0.4708096027374268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,1,power_law_1.2,0.4724736213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,1,power_law_1.2,0.47861762046813966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,1,power_law_1.2,0.4833280086517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,1,power_law_1.2,0.4880383968353271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,1,power_law_1.2,0.5167103767395019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,1,power_law_1.2,0.5576704025268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.6115327835083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.7202816009521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.8849408149719238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,1,power_law_1.2,1.1692031860351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,1,power_law_1.2,1.3914112091064452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,1,power_law_1.2,1.926348876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,1,power_law_1.2,2.3945087432861327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,1,power_law_1.2,3.5579902648925783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,1,power_law_1.2,4.717977523803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,4,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,4,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,4,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,4,balanced,0.03719466676314672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,4,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,4,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,4,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,4,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,4,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,4,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,4,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,4,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,4,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,4,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,4,balanced,0.07679999868075053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,4,balanced,0.16537599762280783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,4,balanced,0.19319466749827066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,4,balanced,0.23688000440597534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,4,balanced,0.2950826684633891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,4,balanced,0.3991893529891968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,4,balanced,0.5440853436787924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,4,balanced,0.9197226365407308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,4,balanced,1.26583464940389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,4,balanced,1.9780267079671223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,4,balanced,2.626901308695475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.08417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.47902722358703614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.693452787399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.801363182067871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,1,power_law_1.01,1.0459136009216308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,1,power_law_1.01,1.094655990600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,1,power_law_1.01,1.143603229522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,1,power_law_1.01,1.1821056365966798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,1,power_law_1.01,1.2793855667114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,1,power_law_1.01,1.3189120292663574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,1,power_law_1.01,1.4036992073059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,1,power_law_1.01,1.469644832611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,1,power_law_1.01,1.5196160316467284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,1,power_law_1.01,1.6523199081420898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,1,power_law_1.01,1.863065528869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,1,power_law_1.01,2.0958911895751955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,1,power_law_1.01,2.509414482116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,1,power_law_1.01,2.993734359741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,1,power_law_1.01,3.871129608154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,1,power_law_1.01,4.793344116210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,1,power_law_1.01,6.689382171630859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,1,power_law_1.01,8.498579406738282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,1,power_law_1.01,12.21427230834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,1,power_law_1.01,15.898828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,1,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,1,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,1,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,1,balanced,0.2384213407834371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,1,balanced,0.45431466897328693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,1,balanced,0.4582293430964152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,1,balanced,0.46353065967559814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,1,balanced,0.46967466672261554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,1,balanced,0.4739413261413574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,1,balanced,0.47786664962768555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,1,balanced,0.4886186520258586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,1,balanced,0.49937065442403156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,1,balanced,0.5085866848627726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,1,balanced,0.5253119866053263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,1,balanced,0.5427093505859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,1,balanced,0.5642240047454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,1,balanced,0.6050133307774862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,1,balanced,0.6732800006866455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,1,balanced,0.7789226373036703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,1,balanced,0.9454933007558187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,1,balanced,1.1496106783548992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,1,balanced,1.5872000058492024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,1,balanced,1.9628373781840007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,1,balanced,2.7419306437174478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,1,balanced,3.5493545532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,1,balanced,5.340159734090169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,1,balanced,7.085056304931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,1,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,1,power_law_1.2,0.3028991937637329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,1,power_law_1.2,0.5339136123657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,1,power_law_1.2,1.0225664138793946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,1,power_law_1.2,1.6351232528686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,1,power_law_1.2,2.434867286682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,1,power_law_1.2,2.738585662841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,1,power_law_1.2,3.8121471405029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,1,power_law_1.2,4.037222290039063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,1,power_law_1.2,4.155801773071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,1,power_law_1.2,4.372889709472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,1,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,1,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,1,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,1,balanced,0.2379093368848165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,1,balanced,0.45395731925964355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,1,balanced,0.45550934473673504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,1,balanced,0.45737600326538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,1,balanced,0.46301865577697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,1,balanced,0.46590932210286456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,1,balanced,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,1,balanced,0.474453330039978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,1,balanced,0.48128000895182294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,1,power_law_1.2,4.5070335388183596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,1,balanced,0.48622934023539227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,1,balanced,0.49851731459299725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,1,balanced,0.5099519888559977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,1,balanced,0.5207039912541708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,1,balanced,0.5348693529764811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,1,balanced,0.5794080098470052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,1,balanced,0.6285653511683146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,1,balanced,0.7188479900360107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,1,power_law_1.2,4.651609420776367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,1,balanced,0.8360959688822428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,1,balanced,1.087488015492757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,1,balanced,1.327445348103841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,1,balanced,1.8143572807312012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,1,power_law_1.2,4.877107238769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,1,balanced,2.2701919873555503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,1,balanced,3.261610666910807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,1,power_law_1.2,5.092556762695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,1,balanced,4.212736129760742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,1,power_law_1.2,5.15338249206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,1,power_law_1.2,5.505228805541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,1,power_law_1.2,5.733375930786133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,1,power_law_1.2,6.165504074096679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,1,power_law_1.2,6.658854675292969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,1,power_law_1.2,7.160012817382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,1,power_law_1.2,8.000511932373048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,1,power_law_1.2,8.83056640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,1,power_law_1.2,10.780671691894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,1,power_law_1.2,12.7098876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,1,power_law_1.2,16.8015869140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,2,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,2,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,1,power_law_1.2,20.351181030273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,2,power_law_1.2,0.027225598692893982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,2,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,2,power_law_1.2,0.029267200827598573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,2,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,2,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,2,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,2,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,2,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,2,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,2,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,2,power_law_1.2,0.04953599870204926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,2,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,2,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,2,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,2,power_law_1.2,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,2,power_law_1.2,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,2,power_law_1.2,0.13537280559539794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,2,power_law_1.2,0.21647360324859619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,2,power_law_1.2,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,32,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,32,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,32,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,32,power_law_1.01,0.02497279942035675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,32,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,32,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,32,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,32,power_law_1.01,0.02374400049448013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,32,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,32,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,32,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,32,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,32,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,32,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,32,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,32,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,32,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,32,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,32,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,32,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,32,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,32,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,32,power_law_1.01,0.02619520127773285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,32,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,32,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,32,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,32,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,32,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,32,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,32,power_law_1.01,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,32,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,32,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,32,power_law_1.01,0.07639039754867553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,32,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,32,power_law_1.01,0.09113600254058837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,32,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,32,power_law_1.01,0.1325055956840515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,32,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,32,power_law_1.01,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,32,power_law_1.01,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,32,power_law_1.01,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,32,power_law_1.01,0.3354624032974243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,32,power_law_1.01,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,32,power_law_1.01,0.13678079843521118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,32,power_law_1.01,0.4190207958221436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,32,power_law_1.01,0.3010560035705566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,32,power_law_1.01,0.7278592109680175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,32,power_law_1.01,0.4442111968994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,32,power_law_1.01,0.9689087867736816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,32,power_law_1.01,0.5675007820129394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,32,power_law_1.01,0.8148991584777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,32,power_law_1.01,1.5249407768249512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,2,power_law_1.2,0.4098048210144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,32,power_law_1.01,2.1520383834838865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,2,power_law_1.2,0.5095424175262451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,2,power_law_1.2,0.7825407981872559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,2,power_law_1.2,1.2599295616149901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,2,power_law_1.01,0.2420736074447632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,2,power_law_1.01,0.3637248039245605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,2,power_law_1.01,0.5832704067230224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,2,power_law_1.01,0.7671807765960693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,2,power_law_1.01,1.063526439666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,2,power_law_1.01,1.4749695777893066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,2,power_law_1.01,1.5210495948791505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,2,power_law_1.01,1.5939583778381348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,2,power_law_1.01,1.6123903274536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,2,power_law_1.01,1.6707584381103515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,2,power_law_1.01,1.682841682434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,2,power_law_1.01,1.6717824935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,2,power_law_1.01,1.7661951065063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,2,power_law_1.01,1.7936384201049804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,2,power_law_1.01,1.744486427307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,2,power_law_1.01,1.7682432174682616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,2,power_law_1.01,1.8548736572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,2,power_law_1.01,1.9859455108642579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,2,power_law_1.01,1.9736576080322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,2,power_law_1.01,2.3023616790771486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,2,power_law_1.01,2.439571189880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,2,power_law_1.01,3.0830591201782225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,2,power_law_1.01,3.6241409301757814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,2,power_law_1.01,5.085184097290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,2,power_law_1.01,5.787443161010742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,2,power_law_1.01,7.975116729736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,2,power_law_1.01,10.358988952636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,2,power_law_1.2,2.151628875732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,8,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,8,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,8,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,8,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,8,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,8,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,8,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,8,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,8,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,8,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,8,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,8,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,8,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,8,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,8,power_law_1.2,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,8,power_law_1.2,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,8,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,8,power_law_1.2,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,8,power_law_1.2,0.11919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,8,power_law_1.2,0.2289664030075073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,8,power_law_1.2,0.3327807903289795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,8,power_law_1.2,0.4739071846008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,8,power_law_1.2,0.8105983734130859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,8,power_law_1.2,1.2791808128356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,8,power_law_1.2,1.8747392654418946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,2,power_law_1.2,2.390220832824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,16,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,16,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,16,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,16,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,16,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,16,balanced,0.03565333286921183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,16,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,16,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,16,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,16,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,16,balanced,0.0382080003619194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,16,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,16,balanced,0.042133331298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,16,balanced,0.04332800209522247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,16,balanced,0.06619733572006226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,16,balanced,0.07116800049940745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,16,balanced,0.13738666971524557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,16,balanced,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,16,balanced,0.2285226583480835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,16,balanced,0.2706666588783264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,16,balanced,0.3285333315531413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,16,balanced,0.3947519858678182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,16,balanced,0.5661013523737589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,16,balanced,0.7702186902364095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,1,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,1,balanced,0.2752853234608968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,1,balanced,0.5285546779632568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,1,balanced,0.5259679953257242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,1,balanced,0.5273600021998087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,1,balanced,0.5319679975509644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,1,balanced,0.5350399812062582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,1,balanced,0.5381120045979818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,1,balanced,0.5471520026524862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,1,balanced,0.5488479932149252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,1,balanced,0.5548266569773356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,1,balanced,0.5602986812591553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,1,balanced,0.5642240047454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,1,balanced,0.5887999931971232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,1,balanced,0.5628586610158285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,1,balanced,0.5840213298797607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,1,balanced,0.6033066511154175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,1,balanced,0.65774933497111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,1,balanced,0.6881013711293539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,1,balanced,0.85316268603007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,1,balanced,1.0832160313924153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,1,balanced,1.5699626604715984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,1,balanced,2.131626605987549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,1,balanced,3.180543899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,1,balanced,4.1830399831136065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,1,balanced,6.299802780151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,1,balanced,8.31556256612142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,32,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,32,balanced,0.034287999073664345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,32,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,32,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,32,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,32,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,32,balanced,0.03754133234421412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,32,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,32,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,32,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,32,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,32,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,32,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,32,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,32,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,32,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,32,balanced,0.052042668064435325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,32,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,32,balanced,0.06894933183987935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,32,balanced,0.08072533210118611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,32,balanced,0.10820266604423523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,32,balanced,0.15957333644231161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,32,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,32,balanced,0.3723946809768677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,32,balanced,0.5626826683680216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,32,balanced,0.7732906341552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,16,power_law_1.2,1.1108351707458497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,16,power_law_1.2,2.007859230041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,16,power_law_1.2,1.7932287216186524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,16,power_law_1.2,2.016870307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,16,power_law_1.2,2.0692991256713866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,16,power_law_1.2,1.3103103637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,16,power_law_1.2,1.7002496719360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,16,power_law_1.2,1.8216960906982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,16,power_law_1.2,1.855276870727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,16,power_law_1.2,1.7366975784301757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,16,power_law_1.2,1.8722816467285157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,16,power_law_1.2,1.758412742614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,4,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,16,power_law_1.2,1.8219007492065429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,4,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,4,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,4,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,16,power_law_1.2,1.8368511199951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,4,power_law_1.01,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,4,power_law_1.01,0.21319680213928222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,16,power_law_1.2,2.101043128967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,16,power_law_1.2,2.1934080123901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,16,power_law_1.2,2.157561683654785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,4,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,4,power_law_1.01,0.2371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,4,power_law_1.01,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,16,power_law_1.2,2.307891273498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,4,power_law_1.01,0.22814719676971434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,4,power_law_1.01,0.24145920276641847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,4,power_law_1.01,0.2578432083129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,16,power_law_1.2,2.409267234802246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,4,power_law_1.01,0.260915207862854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,4,power_law_1.01,0.25250558853149413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,4,power_law_1.01,0.26439681053161623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,4,power_law_1.01,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,16,power_law_1.2,2.7435007095336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,4,power_law_1.01,0.2846719980239868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,4,power_law_1.01,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,4,power_law_1.01,0.315391993522644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,4,power_law_1.01,0.34590721130371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,16,power_law_1.2,3.086950492858887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,4,power_law_1.01,0.37703680992126465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,4,power_law_1.01,0.43970561027526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,4,power_law_1.01,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,16,power_law_1.2,4.026777648925782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,4,power_law_1.01,0.7479296207427979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,4,power_law_1.01,0.9902079582214356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,4,power_law_1.01,1.4317567825317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,16,power_law_1.2,5.079654312133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,4,power_law_1.01,1.92040958404541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,16,power_law_1.2,7.573299407958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,16,power_law_1.2,7.617740631103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,16,power_law_1.2,9.765068817138673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,16,power_law_1.2,12.784435272216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,8,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,8,balanced,0.03463999927043915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,8,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,8,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,8,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,8,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,8,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,8,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,8,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,8,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,8,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,8,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,8,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,8,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,8,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,8,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,8,balanced,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,8,balanced,0.0718506673971812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,8,balanced,0.09489066402117412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,8,balanced,0.17322667439778647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,8,balanced,0.26265599330266315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,8,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,8,balanced,0.42803200085957843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,8,balanced,0.5493760108947754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,8,balanced,0.8480426470438639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,8,balanced,1.205077330271403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,1,power_law_1.01,0.3180543899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,1,power_law_1.01,0.5730303764343262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,1,power_law_1.01,1.100595188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,1,power_law_1.01,1.8778112411499024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,1,power_law_1.01,2.6253311157226564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,1,power_law_1.01,4.13941764831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,1,power_law_1.01,4.467916870117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,1,power_law_1.01,4.592435073852539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,1,power_law_1.01,4.655513763427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,1,power_law_1.01,4.765081787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,1,power_law_1.01,4.82344970703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,1,power_law_1.01,5.039481735229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,1,power_law_1.01,5.171814346313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,1,power_law_1.01,5.232223892211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,16,power_law_1.2,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,16,power_law_1.2,0.17592320442199708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,16,power_law_1.2,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,16,power_law_1.2,0.17223680019378662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,1,power_law_1.01,5.311078262329102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,16,power_law_1.2,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,16,power_law_1.2,0.24453120231628417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,16,power_law_1.2,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,16,power_law_1.2,0.25292799472808836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,16,power_law_1.2,0.2537472009658813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,16,power_law_1.2,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,1,power_law_1.01,5.470003128051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,16,power_law_1.2,0.24983680248260498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,16,power_law_1.2,0.2461695909500122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,16,power_law_1.2,0.25722880363464357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,16,power_law_1.2,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,16,power_law_1.2,0.2582528114318848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,1,power_law_1.01,5.547622299194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,16,power_law_1.2,0.2777087926864624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,16,power_law_1.2,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,16,power_law_1.2,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,16,power_law_1.2,0.33607680797576905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,16,power_law_1.2,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,1,power_law_1.01,5.943500900268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,16,power_law_1.2,0.5599232196807862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,16,power_law_1.2,0.7980991840362549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,1,power_law_1.01,6.085427093505859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,1,power_law_1.01,6.462258911132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,1,power_law_1.01,7.200563049316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,16,power_law_1.2,0.8114175796508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,1,power_law_1.01,8.423001861572265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,1,power_law_1.01,9.218048095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,16,power_law_1.2,1.3379584312438966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,1,power_law_1.01,12.217753601074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,1,power_law_1.01,14.332313537597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,16,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,16,balanced,0.2892799973487854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,16,balanced,0.5497173468271891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,16,balanced,1.0666666825612385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,16,balanced,1.7472853660583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,16,balanced,2.111658732096354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,16,balanced,2.1145599683125815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,16,balanced,2.088618596394857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,16,balanced,2.09169069925944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,16,balanced,2.095786730448405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,16,balanced,2.0860586166381836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,16,balanced,2.0937387148539224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,1,power_law_1.01,20.000767517089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,16,balanced,2.097983996073405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,16,balanced,2.1079039573669434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,16,balanced,2.1208747227986655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,16,balanced,2.1428906122843423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,16,balanced,2.1531306902567544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,16,balanced,2.1882665952046714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,16,balanced,2.2275412877400718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,16,balanced,2.2316373189290366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,16,balanced,2.3072266578674316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,16,balanced,2.486442724863688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,16,balanced,2.6427733103434243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,1,power_law_1.01,25.266995239257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,16,balanced,3.080874760945638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,16,balanced,3.4703359603881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,16,balanced,4.65339724222819
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,16,balanced,5.612703959147136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,16,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,16,power_law_1.2,1.7252351760864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,16,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,16,power_law_1.01,0.21770238876342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,16,power_law_1.01,0.19967999458312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,16,power_law_1.01,0.21582720279693604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,16,power_law_1.01,0.21338241100311278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,16,power_law_1.01,0.18124799728393554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,16,power_law_1.01,0.16401920318603516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,16,power_law_1.01,0.12019840478897095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,16,power_law_1.01,0.15626239776611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,16,power_law_1.01,0.18575359582901002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,16,power_law_1.01,0.1601408004760742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,16,power_law_1.01,0.1597440004348755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,16,power_law_1.01,0.19189759492874145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,16,power_law_1.01,0.19352320432662964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,16,power_law_1.01,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,16,power_law_1.01,0.23982079029083253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,16,power_law_1.01,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,16,power_law_1.01,0.2568192005157471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,16,power_law_1.01,0.30842878818511965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,16,power_law_1.01,0.3358720064163208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,16,power_law_1.01,0.4577280044555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,16,power_law_1.01,0.5816319942474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,16,power_law_1.01,0.9730048179626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,16,power_law_1.01,1.3856767654418944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,16,power_law_1.01,1.9197952270507812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,16,power_law_1.01,2.507571220397949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,16,power_law_1.2,2.578227233886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,2,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,2,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,2,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,2,balanced,0.07372800012429555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,2,balanced,0.27460267146428424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,2,balanced,0.5328213373819987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,2,balanced,0.537770668665568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,2,balanced,0.5387946764628092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,2,balanced,0.5430399974187216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,2,balanced,0.5459626515706381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,2,balanced,0.555178682009379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,2,balanced,0.5648800134658813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,2,balanced,0.5725866556167603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,2,balanced,0.5889706611633301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,2,balanced,0.6087679862976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,2,balanced,0.6248106559117635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,2,balanced,0.664576013882955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,2,balanced,0.7715840339660645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,2,balanced,0.8657920360565186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,2,balanced,1.083194653193156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,2,balanced,1.340928077697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,2,balanced,1.8566826184590657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,2,balanced,2.3058719635009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,2,balanced,3.330730756123861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,2,balanced,4.291584014892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,2,balanced,6.218069076538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,2,balanced,8.217599868774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,2,balanced,0.18210132916768393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,2,balanced,0.35140268007914227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,2,balanced,0.6703786849975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,2,balanced,1.300650676091512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,2,balanced,2.5569279988606772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,2,balanced,5.070842742919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,2,balanced,5.076821327209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,2,balanced,5.08842658996582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,2,balanced,5.093205451965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,16,power_law_1.2,4.058726501464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,2,balanced,5.1024214426676435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,2,balanced,5.115733464558919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,2,balanced,5.132970809936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,2,balanced,5.145600001017253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,2,balanced,5.1732479731241865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,2,balanced,5.2031145095825195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,2,balanced,5.228885332743327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,2,balanced,5.286725362141927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,2,balanced,5.544789632161458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,2,balanced,5.634218851725261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,2,balanced,5.822634379069011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,2,balanced,6.027093251546224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,16,power_law_1.01,1.054310417175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,2,balanced,6.1856428782145185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,16,power_law_1.01,2.0627328872680666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,16,power_law_1.01,2.103500747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,2,balanced,6.589951833089192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,16,power_law_1.01,1.9671039581298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,2,balanced,6.946816126505534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,16,power_law_1.01,2.069503974914551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,16,power_law_1.01,1.426022434234619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,16,power_law_1.01,1.7475584030151368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,2,balanced,7.59176508585612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,16,power_law_1.01,1.724825668334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,16,power_law_1.01,1.800806427001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,16,power_law_1.01,1.7324031829833983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,2,balanced,9.290581385294596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,16,power_law_1.01,1.8884607315063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,16,power_law_1.01,1.9304447174072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,16,power_law_1.01,1.9599359512329102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,2,balanced,11.689130147298178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,16,power_law_1.01,1.8309120178222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,16,power_law_1.01,1.9795967102050782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,16,power_law_1.01,2.0801536560058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,16,power_law_1.01,1.947648048400879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,16,power_law_1.01,2.2611967086791993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,16,power_law_1.01,2.225356864929199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,16,power_law_1.01,2.6214208602905273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,16,power_law_1.01,2.750873565673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,16,power_law_1.01,3.430400085449219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,16,power_law_1.01,4.223385620117187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,16,power_law_1.01,5.354086303710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,16,power_law_1.01,5.709823989868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,16,power_law_1.01,7.346380615234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,16,power_law_1.01,9.559859466552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,1,balanced,1.1142826875050862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,1,balanced,2.053290685017904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,1,balanced,4.128053347269694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,1,balanced,8.193509419759115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,1,balanced,15.92181396484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,1,balanced,31.821141560872395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,4,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,4,power_law_1.2,0.17940479516983032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,4,power_law_1.2,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,4,power_law_1.2,0.3749887943267822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,4,power_law_1.2,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,4,power_law_1.2,0.6221824169158936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,4,power_law_1.2,0.6684671878814697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,4,power_law_1.2,0.6776832103729248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,4,power_law_1.2,0.6967296123504638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,4,power_law_1.2,0.6504447937011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,4,power_law_1.2,0.6993919849395752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,4,power_law_1.2,0.718233585357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,4,power_law_1.2,0.7499775886535645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,4,power_law_1.2,0.7516160011291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,4,power_law_1.2,0.799948787689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,4,power_law_1.2,0.7854080200195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,1,balanced,31.8566411336263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,4,power_law_1.2,0.8388607978820801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,4,power_law_1.2,0.9168767929077148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,4,power_law_1.2,0.9490431785583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,4,power_law_1.2,1.2199935913085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,4,power_law_1.2,1.2148736000061036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,4,power_law_1.2,1.7152000427246095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,4,power_law_1.2,2.068889617919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,4,power_law_1.2,2.9544448852539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,4,power_law_1.2,3.4181121826171874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,1,balanced,31.871317545572918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,1,balanced,31.90868886311849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,1,balanced,31.935658772786457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,4,power_law_1.2,5.973811340332031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,1,balanced,32.00426737467448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,4,power_law_1.2,7.8788604736328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,1,balanced,32.05939229329427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,1,balanced,32.11383565266927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,1,balanced,32.209716796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,1,balanced,32.33757781982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,1,balanced,32.43639373779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,1,balanced,32.68128458658854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,1,balanced,34.04883829752604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,8,power_law_1.2,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,8,power_law_1.2,0.28035199642181396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,8,power_law_1.2,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,8,power_law_1.2,0.4448256015777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,8,power_law_1.2,0.49684481620788573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,1,balanced,34.81565856933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,8,power_law_1.2,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,8,power_law_1.2,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,8,power_law_1.2,0.5087232112884521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,8,power_law_1.2,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,8,power_law_1.2,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,16,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,16,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,8,power_law_1.2,0.5128191947937012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,16,balanced,0.24644267559051514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,16,balanced,0.2491626739501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,16,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,8,power_law_1.2,0.510975980758667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,16,balanced,0.2510506709416707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,16,balanced,0.2515626748402913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,16,balanced,0.25224532683690387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,16,balanced,0.2553173303604126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,8,power_law_1.2,0.5404416084289551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,16,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,16,balanced,0.258730669816335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,16,balanced,0.26265599330266315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,16,balanced,0.26845866441726685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,8,power_law_1.2,0.5781504154205322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,16,balanced,0.27187200387318927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,16,balanced,0.2786986629168193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,16,balanced,0.2901279926300049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,8,power_law_1.2,0.5914624214172364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,8,power_law_1.2,0.5824384212493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,8,power_law_1.2,0.6055871963500976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,8,power_law_1.2,0.6866943836212158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,16,balanced,0.2995199958483378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,16,balanced,0.3199999928474426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,16,balanced,0.35020800431569415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,1,balanced,35.566932678222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,8,power_law_1.2,0.7471104145050049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,16,balanced,0.40635732809702557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,16,balanced,0.46403201421101886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,8,power_law_1.2,0.8806400299072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,16,balanced,0.6106346845626831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,16,balanced,0.7741440137227377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,8,power_law_1.2,1.057753562927246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,16,balanced,1.2045653661092122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,8,power_law_1.2,1.4202879905700683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,16,balanced,1.624234676361084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,8,power_law_1.2,1.6066560745239258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,8,power_law_1.2,2.3836671829223635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,8,power_law_1.2,2.979635238647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,1,balanced,36.48887379964193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,8,power_law_1.2,4.354867172241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,32,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,32,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,32,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,32,balanced,0.05649066468079885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,32,balanced,0.2853546738624573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,32,balanced,0.5497066577275594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,32,balanced,0.5515893300374349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,32,balanced,0.5504000186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,32,balanced,0.5490346749623617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,32,balanced,0.549888014793396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,32,balanced,0.5546666781107584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,32,balanced,0.5575679937998453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,32,balanced,0.5597866773605347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,32,balanced,0.5611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,32,balanced,0.5679786602656046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,8,power_law_1.2,5.626643371582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,32,balanced,0.5703680117925009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,32,balanced,0.5797546704610189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,32,balanced,0.601253350575765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,32,balanced,0.6169600089391073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,32,balanced,0.6879573663075765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,32,balanced,0.6761813163757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,32,balanced,0.7679999669392904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,32,balanced,0.8120319843292236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,32,balanced,0.9873066743214926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,32,balanced,1.1533652941385906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,32,balanced,1.4603947003682454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,1,balanced,45.70641072591146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,32,balanced,1.8676053682963054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,1,balanced,60.37060038248698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.09646080136299133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,1,balanced,49.80427551269531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.5183487892150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.6871039867401123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,1,power_law_1.01,1.1329536437988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,1,power_law_1.01,1.1745280265808105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,1,power_law_1.01,1.2322815895080566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,1,power_law_1.01,1.2589056015014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,1,power_law_1.01,1.337343978881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,1,power_law_1.01,1.3760512351989747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,1,power_law_1.01,1.3913984298706055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,1,power_law_1.01,1.425203227996826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,1,power_law_1.01,1.4819328308105468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,1,power_law_1.01,1.537228775024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,1,power_law_1.01,1.5929344177246094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,1,power_law_1.01,1.6463872909545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,1,power_law_1.01,1.8122751235961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,1,balanced,51.69817606608073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,1,power_law_1.01,1.9816448211669921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,1,power_law_1.01,2.3570432662963867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,1,power_law_1.01,2.7443199157714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,1,power_law_1.01,3.565158462524414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,16,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,16,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,1,power_law_1.01,4.269875335693359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,16,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,16,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,16,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,16,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,16,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,16,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,16,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,1,power_law_1.01,5.968281555175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,16,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,16,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,16,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,16,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,16,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,1,power_law_1.01,7.584563446044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,16,power_law_1.01,0.07372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,16,power_law_1.01,0.09379199743270875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,16,power_law_1.01,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,16,power_law_1.01,0.17100800275802613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,1,balanced,64.88234456380208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,16,power_law_1.01,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,16,power_law_1.01,0.3543040037155151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,16,power_law_1.01,0.5115903854370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,16,power_law_1.01,0.8054783821105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,1,power_law_1.01,10.936921691894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,16,power_law_1.01,1.0620672225952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,1,power_law_1.01,14.267391967773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,1,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,1,power_law_1.01,0.04564479887485504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,1,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,1,power_law_1.01,0.17408000230789183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,1,power_law_1.01,0.28631041049957273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,1,power_law_1.01,0.35246078968048095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,1,power_law_1.01,0.5025792121887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,1,power_law_1.01,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,1,power_law_1.01,0.5498879909515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,1,power_law_1.01,0.5640192031860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,1,power_law_1.01,0.5820159912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,1,power_law_1.01,0.608460807800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,1,power_law_1.01,0.6201216220855713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,1,power_law_1.01,0.6473408222198487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,1,power_law_1.01,0.6651904106140136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,1,power_law_1.01,0.6854656219482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,1,power_law_1.01,0.7278592109680175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,1,power_law_1.01,0.8083456039428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,1,balanced,66.50845845540364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,1,power_law_1.01,0.892518424987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,1,power_law_1.01,1.0168319702148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,1,power_law_1.01,1.1851776123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,1,power_law_1.01,1.5212544441223144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,1,power_law_1.01,1.8552831649780273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,1,power_law_1.01,2.4805376052856447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,1,power_law_1.01,3.115212821960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,1,power_law_1.01,4.444979095458985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,1,power_law_1.01,5.841100692749023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,4,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,4,balanced,0.025594666600227356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,4,balanced,0.027295999228954315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,4,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,4,balanced,0.17510400215784708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,4,balanced,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,4,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,4,balanced,0.25224532683690387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,4,balanced,0.2529279987017314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,4,balanced,0.25412267446517944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,4,balanced,0.25514666239420575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,4,balanced,0.25753599405288696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,4,balanced,0.25804799795150757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,4,balanced,0.2611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,4,balanced,0.265557328859965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,4,balanced,0.2677759925524394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,4,balanced,0.2728959918022156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,4,balanced,0.272213339805603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,4,balanced,0.29320534070332843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,4,balanced,0.30293333530426025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,4,balanced,0.3336533308029175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,4,balanced,0.37614933649698895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,4,balanced,0.429909348487854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,4,balanced,0.6132053136825562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,4,balanced,0.7965013186136881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,4,balanced,1.2323839664459229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,4,balanced,1.5527253150939941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,8,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,8,power_law_1.01,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,8,power_law_1.01,0.1619968056678772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,8,power_law_1.01,0.1669119954109192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,8,power_law_1.01,0.18943359851837158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,8,power_law_1.01,0.2150399923324585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,8,power_law_1.01,0.2416640043258667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,8,power_law_1.01,0.23837440013885497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,8,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,8,power_law_1.01,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,8,power_law_1.01,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,8,power_law_1.01,0.25661439895629884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,8,power_law_1.01,0.25620479583740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,8,power_law_1.01,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,8,power_law_1.01,0.2910207986831665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,8,power_law_1.01,0.29675519466400146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,8,power_law_1.01,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,8,power_law_1.01,0.30945279598236086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,8,power_law_1.01,0.36267518997192383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,8,power_law_1.01,0.42905597686767577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,8,power_law_1.01,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,8,power_law_1.01,0.8151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,8,power_law_1.01,1.0663935661315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,8,power_law_1.01,1.5265791893005372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,8,power_law_1.01,2.0363264083862305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,8,power_law_1.01,2.8405759811401365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,8,power_law_1.01,3.816243362426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,64,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,64,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,64,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,64,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,64,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,64,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,64,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,64,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,64,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,64,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,64,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,64,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,64,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,64,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,64,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,64,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,64,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,64,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,64,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,64,balanced,0.07031466563542683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,64,balanced,0.08260266482830048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,64,balanced,0.11929600437482198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,64,balanced,0.1250986655553182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,64,balanced,0.22920533021291098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,64,balanced,0.28330665826797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,64,balanced,0.4266666571299235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,64,balanced,0.5174560149510702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,32,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,32,power_law_1.2,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,32,power_law_1.2,0.21398398876190186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,32,power_law_1.2,0.21299200057983397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,32,power_law_1.2,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,32,power_law_1.2,0.1078976035118103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,32,power_law_1.2,0.1810431957244873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,32,power_law_1.2,0.18800640106201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,32,power_law_1.2,0.1875839948654175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,32,power_law_1.2,0.1447808027267456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,32,power_law_1.2,0.18411519527435302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,32,power_law_1.2,0.20971519947052003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,32,power_law_1.2,0.16261119842529298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,32,power_law_1.2,0.1820672035217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,32,power_law_1.2,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,32,power_law_1.2,0.2234368085861206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,32,power_law_1.2,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,32,power_law_1.2,0.22814719676971434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,32,power_law_1.2,0.2590719938278198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,32,power_law_1.2,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,32,power_law_1.2,0.35983359813690186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,32,power_law_1.2,0.5822463989257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,32,power_law_1.2,0.6891520023345947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,32,power_law_1.2,0.9596927642822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,32,power_law_1.2,1.347379207611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,32,power_law_1.2,1.9902399063110352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,32,power_law_1.2,2.7406335830688477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,256,balanced,0.057162667314211525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,256,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,256,balanced,0.05714133381843567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,256,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,256,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,256,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,256,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,256,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,256,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,256,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,256,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,256,balanced,0.06860800087451935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,256,balanced,0.06929066777229309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,256,balanced,0.07082666456699371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,256,balanced,0.07372800012429555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,256,balanced,0.07492266595363617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,256,balanced,0.08021333316961925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,256,balanced,0.10103467106819153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,256,balanced,0.14298666516939798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,256,balanced,0.1979680061340332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,256,balanced,0.2146986722946167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,256,balanced,0.254805326461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,256,balanced,0.3089066743850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,256,balanced,0.4220586617787679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,256,balanced,0.5215573310852051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,256,balanced,0.7365972995758057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,256,balanced,0.9697226683298746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,4,power_law_1.2,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,4,power_law_1.2,0.15994880199432374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,4,power_law_1.2,0.1644544005393982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,4,power_law_1.2,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,4,power_law_1.2,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,4,power_law_1.2,0.2506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,4,power_law_1.2,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,4,power_law_1.2,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,4,power_law_1.2,0.2506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,4,power_law_1.2,0.25477120876312254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,4,power_law_1.2,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,4,power_law_1.2,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,4,power_law_1.2,0.2846719980239868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,4,power_law_1.2,0.3041280031204224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,4,power_law_1.2,0.3534784078598022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,4,power_law_1.2,0.318668794631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,4,power_law_1.2,0.42270717620849607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,4,power_law_1.2,0.5668863773345947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,4,power_law_1.2,0.6350848197937011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,4,power_law_1.2,0.809779167175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,64,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,64,balanced,0.021669333179791767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,64,balanced,0.021333334346612293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,64,balanced,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,64,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,64,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,64,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,64,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,64,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,64,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,64,balanced,0.023887999355793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,64,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,64,balanced,0.02420266717672348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,64,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,64,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,64,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,64,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,64,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,64,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,64,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,64,balanced,0.06400000055631001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,64,balanced,0.12611200412114462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,4,power_law_1.2,1.1390975952148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,64,balanced,0.27153066794077557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,64,balanced,0.3643733263015747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,4,power_law_1.2,1.5484928131103515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,4,power_law_1.01,0.601907205581665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,4,power_law_1.01,1.0577919960021973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,4,power_law_1.01,1.520025634765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,4,power_law_1.01,1.9167232513427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,4,power_law_1.01,2.274304008483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,4,power_law_1.01,2.425856018066406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,4,power_law_1.01,3.154739189147949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,4,power_law_1.01,3.295027160644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,4,power_law_1.01,3.401318359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,4,power_law_1.01,3.410521697998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,4,power_law_1.01,3.23768310546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,4,power_law_1.01,3.453337478637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,4,power_law_1.01,3.735347366333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,4,power_law_1.01,3.7140480041503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,4,power_law_1.2,2.3283712387084963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,4,power_law_1.01,3.6179969787597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,4,power_law_1.01,3.730636978149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,4,power_law_1.01,3.890585708618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,4,power_law_1.01,4.173619079589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,4,power_law_1.01,4.353023910522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,4,power_law_1.01,4.585472106933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,4,power_law_1.01,4.89799690246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,4,power_law_1.01,5.3639167785644535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,4,power_law_1.01,6.626713562011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,4,power_law_1.01,8.151449584960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,4,power_law_1.01,9.281536102294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,4,power_law_1.2,3.1356927871704103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,4,power_law_1.01,11.681382751464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,4,power_law_1.01,16.009625244140626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,4,power_law_1.2,4.627648162841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,4,power_law_1.2,6.109388732910157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,2,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,2,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,2,power_law_1.01,0.4448256015777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,2,power_law_1.01,0.6699007987976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,2,power_law_1.01,0.9334783554077148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,2,power_law_1.01,1.1868160247802735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,2,power_law_1.01,1.5417344093322753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,2,power_law_1.01,1.5437824249267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,2,power_law_1.01,1.6046079635620116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,2,power_law_1.01,1.780735969543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,2,power_law_1.01,1.6029695510864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,2,power_law_1.01,1.8329599380493165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,2,power_law_1.01,1.8247360229492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,2,power_law_1.01,1.9904512405395507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,2,power_law_1.01,1.9593215942382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,2,power_law_1.01,2.041235160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,2,power_law_1.01,2.0977664947509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,2,power_law_1.01,2.2716415405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,2,power_law_1.01,2.4242176055908202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,2,power_law_1.01,2.6656768798828123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,2,power_law_1.01,2.8807167053222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,2,power_law_1.01,3.6120574951171873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,2,power_law_1.01,4.05852165222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.6064127922058106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,2,power_law_1.01,5.356544113159179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,1,power_law_1.2,1.0475520133972167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,1,power_law_1.2,2.029567909240723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,2,power_law_1.01,6.507110595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,1,power_law_1.2,3.5948543548583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,1,power_law_1.2,5.345075225830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,2,power_law_1.01,9.09680633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,1,power_law_1.2,7.579647827148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,2,power_law_1.01,11.136409759521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,1,power_law_1.2,11.10855712890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,1,power_law_1.2,11.559935760498046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,1,power_law_1.2,12.288819122314454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,1,power_law_1.2,12.517990112304688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,1,power_law_1.2,13.350297546386718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,1,power_law_1.2,13.39166717529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,1,power_law_1.2,13.967155456542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,1,power_law_1.2,14.859263610839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,4,power_law_1.2,7.53623046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,1,power_law_1.2,15.165029907226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,1,power_law_1.2,15.313504028320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,1,power_law_1.2,16.36822967529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,1,power_law_1.2,17.140736389160157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,1,power_law_1.2,17.585356140136717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,1,power_law_1.2,18.686566162109376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,1,power_law_1.2,20.530380249023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,1,power_law_1.2,22.70740509033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,16,power_law_1.01,0.321126389503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,1,power_law_1.2,25.637478637695313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,16,power_law_1.01,0.5410816192626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,16,power_law_1.01,0.5468160152435303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,16,power_law_1.01,0.5273600101470948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,16,power_law_1.01,0.5609471797943115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,16,power_law_1.01,0.4476928234100342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,16,power_law_1.01,0.4892672061920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,16,power_law_1.01,0.4863999843597412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,16,power_law_1.01,0.5292031764984131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,16,power_law_1.01,0.47329277992248536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,16,power_law_1.01,0.522649621963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,16,power_law_1.01,0.5156864166259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,16,power_law_1.01,0.48250880241394045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,16,power_law_1.01,0.5148672103881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,16,power_law_1.01,0.5666816234588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,16,power_law_1.01,0.5363711833953857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,16,power_law_1.01,0.577126407623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,16,power_law_1.01,0.6039423942565918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,16,power_law_1.01,0.6338175773620606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,16,power_law_1.01,0.718233585357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,1,power_law_1.2,31.769790649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,16,power_law_1.01,0.7954432010650635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,16,power_law_1.01,0.9486335754394531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,16,power_law_1.01,1.1440128326416015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,16,power_law_1.01,1.6662527084350587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,16,power_law_1.01,2.1403648376464846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,16,power_law_1.01,3.182796859741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,1,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,16,power_law_1.01,3.867033767700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,1,power_law_1.2,0.12513279914855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,1,power_law_1.2,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,1,power_law_1.2,0.43909120559692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,1,power_law_1.2,0.5656576156616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,1,power_law_1.2,31.9098876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,1,power_law_1.2,1.0696703910827636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,1,power_law_1.2,1.1507712364196778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,1,power_law_1.2,1.2140543937683106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,1,power_law_1.2,1.2611583709716796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,1,power_law_1.2,1.2703743934631349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,1,power_law_1.2,1.3363200187683106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,1,power_law_1.2,1.3899776458740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,1,power_law_1.2,1.3893631935119628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,1,power_law_1.2,1.4514176368713378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,1,power_law_1.2,1.4950400352478028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,1,power_law_1.2,1.5366144180297852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,1,power_law_1.2,1.6166912078857423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,1,power_law_1.2,1.7899391174316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,1,power_law_1.2,1.945395278930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,1,power_law_1.2,2.2994943618774415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,1,power_law_1.2,2.6187776565551757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,1,power_law_1.2,41.1799560546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,1,power_law_1.2,3.2665599822998046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,1,power_law_1.2,3.7345279693603515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,1,power_law_1.2,5.01104621887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,1,power_law_1.2,6.436249542236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,1,power_law_1.2,50.15449523925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,4,power_law_1.2,0.18882559537887572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,4,power_law_1.2,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,4,power_law_1.2,0.4005887985229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,4,power_law_1.2,0.561356782913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,4,power_law_1.2,0.7358463764190674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,4,power_law_1.2,0.6719488143920899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,4,power_law_1.2,0.9302016258239746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,4,power_law_1.2,1.1044672012329102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,4,power_law_1.2,1.0659839630126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,4,power_law_1.2,1.0794943809509276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,4,power_law_1.2,1.1167743682861329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,1,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,4,power_law_1.2,1.1479040145874024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,1,power_law_1.2,9.28194580078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,1,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,4,power_law_1.2,1.1597503662109374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,1,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,1,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,1,power_law_1.2,0.09460480213165283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,1,power_law_1.2,0.14888960123062134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,1,power_law_1.2,0.260697603225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,4,power_law_1.2,1.2122112274169923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,1,power_law_1.2,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,1,power_law_1.2,0.2973695993423462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,4,power_law_1.2,1.2488703727722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,1,power_law_1.2,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,4,power_law_1.2,1.3058048248291017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,1,power_law_1.2,0.3172352075576782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,1,power_law_1.2,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,4,power_law_1.2,1.3283328056335448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,1,power_law_1.2,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,4,power_law_1.2,1.3404159545898438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,1,power_law_1.2,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,1,power_law_1.2,0.39178240299224854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,4,power_law_1.2,1.4045184135437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,1,power_law_1.2,0.41103358268737794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,1,power_law_1.2,0.44072961807250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,4,power_law_1.2,1.561190414428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,1,power_law_1.2,0.49500160217285155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,1,power_law_1.2,0.6025216102600097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,4,power_law_1.2,1.7416191101074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,1,power_law_1.2,0.7598080158233642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,1,power_law_1.2,0.9484288215637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,4,power_law_1.2,1.9984384536743165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,1,power_law_1.2,1.3111295700073242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,4,power_law_1.2,2.2898687362670898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,1,power_law_1.2,1.680793571472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,4,power_law_1.2,2.9509632110595705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,1,power_law_1.2,2.448588752746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,4,power_law_1.2,3.265087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,1,power_law_1.2,3.2454654693603517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,4,power_law_1.2,4.487782287597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,1,power_law_1.2,4.889804840087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,4,power_law_1.2,5.677465438842773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,1,power_law_1.2,6.551757049560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,1,power_law_1.2,12.002304077148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,8,power_law_1.2,0.05795199871063232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,8,power_law_1.2,0.2795520067214966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,8,power_law_1.2,0.29243519306182864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,8,power_law_1.2,0.38092799186706544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,8,power_law_1.2,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,8,power_law_1.2,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,8,power_law_1.2,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,8,power_law_1.2,0.4317183971405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,8,power_law_1.2,0.476364803314209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,8,power_law_1.2,0.5099520206451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,8,power_law_1.2,0.481279993057251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,8,power_law_1.2,0.5402624130249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,8,power_law_1.2,0.4880383968353271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,8,power_law_1.2,0.5312320232391358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,8,power_law_1.2,0.5380095958709716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,8,power_law_1.2,0.5580607891082764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,8,power_law_1.2,0.5683199882507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,8,power_law_1.2,0.6109055995941162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,8,power_law_1.2,0.6846271991729737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,8,power_law_1.2,0.7804927825927734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,8,power_law_1.2,0.8624128341674805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,8,power_law_1.2,1.0721280097961425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,8,power_law_1.2,1.3545472145080566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,8,power_law_1.2,2.007859230041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,8,power_law_1.2,2.579251289367676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,8,power_law_1.2,3.8725631713867186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,8,power_law_1.2,4.854169464111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,8,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,8,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,8,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,8,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,8,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,8,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,8,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,8,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,8,power_law_1.2,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,8,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,8,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,8,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,8,power_law_1.2,0.02928000092506409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,8,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,8,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,8,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,8,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,8,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,8,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,8,power_law_1.2,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,128,power_law_1.01,0.46100478172302245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,128,power_law_1.01,0.415334415435791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,128,power_law_1.01,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,128,power_law_1.01,0.415334415435791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,128,power_law_1.01,0.41738238334655764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,128,power_law_1.01,0.39403519630432127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,8,power_law_1.2,0.1505280017852783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,128,power_law_1.01,0.4233215808868408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,128,power_law_1.01,0.42287359237670896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,128,power_law_1.01,0.42575998306274415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,128,power_law_1.01,0.4263807773590088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,128,power_law_1.01,0.42987518310546874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,128,power_law_1.01,0.4325119972229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,128,power_law_1.01,0.43454718589782715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,128,power_law_1.01,0.43909120559692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,128,power_law_1.01,0.44462080001831056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,128,power_law_1.01,0.4632575988769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,128,power_law_1.01,0.4892672061920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,128,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,128,power_law_1.01,0.5558271884918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,128,power_law_1.01,0.6481919765472413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,8,power_law_1.2,0.20336639881134033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,128,power_law_1.01,0.6916096210479736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,128,power_law_1.01,0.9871359825134277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,128,power_law_1.01,1.3479935646057128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,128,power_law_1.01,1.801625633239746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,128,power_law_1.01,2.3418880462646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,128,power_law_1.01,3.358310317993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,128,power_law_1.01,4.58711051940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,8,power_law_1.2,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,8,power_law_1.2,0.454041576385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,8,power_law_1.2,0.6207488059997559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,1,balanced,0.30873600641886395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,1,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,1,balanced,1.0362666447957356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,1,balanced,2.0799147288004556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,1,balanced,4.055376052856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,1,balanced,7.971498489379883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,1,balanced,7.988224029541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,1,balanced,8.013823827107748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,1,balanced,8.031744003295898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,32,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,32,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,32,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,32,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,32,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,1,balanced,8.056490580240885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,32,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,32,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,32,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,32,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,32,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,32,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,32,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,1,balanced,8.095914840698242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,32,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,32,power_law_1.01,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,32,power_law_1.01,0.03459199965000152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,32,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,32,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,32,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,32,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,1,balanced,8.133632024129232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,32,power_law_1.01,0.05978239774703979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,32,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,32,power_law_1.01,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,32,power_law_1.01,0.14520319700241088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,32,power_law_1.01,0.25763840675354005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,32,power_law_1.01,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,1,balanced,8.165887832641602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,32,power_law_1.01,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,32,power_law_1.01,0.6279168128967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,1,balanced,8.227669397989908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,8,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,8,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,8,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,8,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,1,balanced,8.294399897257486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,8,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,8,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,8,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,8,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,8,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,8,power_law_1.01,0.03685120046138764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,1,balanced,8.354133605957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,8,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,8,power_law_1.01,0.04320639967918396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,8,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,8,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,8,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,1,balanced,8.483157475789389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,8,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,8,power_law_1.01,0.09441279768943786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,8,power_law_1.01,0.11752959489822387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,8,power_law_1.01,0.1640447974205017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,8,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,1,balanced,8.953856150309244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,8,power_law_1.01,0.31395840644836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,8,power_law_1.01,0.47370238304138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,8,power_law_1.01,0.6602752208709717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,8,power_law_1.01,1.0766336441040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,1,balanced,9.203370412190756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,8,power_law_1.01,1.5089664459228516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,1,balanced,9.659562428792318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,1,balanced,10.445482889811197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,1,balanced,11.039403279622396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,1,balanced,11.76593017578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,1,balanced,13.838165283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,1,balanced,15.981226603190104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,8,power_law_1.2,0.5992447853088378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,8,power_law_1.2,1.0360832214355469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,1,balanced,20.95957310994466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,8,power_law_1.2,1.5110143661499023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,8,power_law_1.2,1.8663423538208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,8,power_law_1.2,2.486067199707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,8,power_law_1.2,2.714214324951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,8,power_law_1.2,1.1198464393615724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,8,power_law_1.2,2.9272064208984374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,1,balanced,26.76153055826823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,8,power_law_1.2,2.4922111511230467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,8,power_law_1.2,2.8254207611083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,8,power_law_1.2,2.7250688552856444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,8,power_law_1.2,2.5206783294677733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,8,power_law_1.2,2.2794240951538085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,8,power_law_1.2,2.592767906188965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,8,power_law_1.2,2.6038272857666014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,8,power_law_1.2,2.5997312545776365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,8,power_law_1.2,2.5524223327636717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,8,power_law_1.2,2.733465576171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,8,power_law_1.2,2.834022331237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,8,power_law_1.2,3.0257152557373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,8,power_law_1.2,3.0060543060302733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,8,power_law_1.2,3.5276798248291015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,8,power_law_1.2,4.0253440856933596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,8,power_law_1.2,4.661248016357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,8,power_law_1.2,5.728044891357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,8,power_law_1.2,6.621798706054688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.1183743953704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.23630719184875487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.3305471897125244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,8,power_law_1.2,9.422847747802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.5703680038452148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.6340608119964599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.6535168170928956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.6899456024169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.7026688098907471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.7362559795379638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.7608320236206054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.7886591911315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,8,power_law_1.2,10.208863830566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.8283967971801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.8562687873840332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.9029631614685059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.9709568023681641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,1,power_law_1.2,1.1499520301818849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,1,power_law_1.2,1.341433620452881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,1,power_law_1.2,1.6672767639160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,1,power_law_1.2,1.9990528106689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,1,power_law_1.2,2.754969596862793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,1,power_law_1.2,3.5356544494628905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,1,power_law_1.2,5.164441680908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,1,power_law_1.2,6.771501159667968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,1,power_law_1.2,9.98131866455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,8,power_law_1.2,1.491763210296631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,1,power_law_1.2,13.171302795410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,8,power_law_1.01,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,8,power_law_1.01,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,8,power_law_1.01,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,8,power_law_1.01,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,8,power_law_1.01,0.471449613571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,8,power_law_1.01,0.4777984142303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,8,power_law_1.01,0.5892096042633057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,8,power_law_1.01,0.7012351989746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,8,power_law_1.01,0.8157183647155761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,8,power_law_1.01,0.9901951789855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,8,power_law_1.01,0.8089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,8,power_law_1.01,0.9205760002136231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,8,power_law_1.01,1.1577343940734863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,8,power_law_1.01,1.3469696044921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,8,power_law_1.01,1.518777561187744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,8,power_law_1.01,1.9863487243652345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,8,power_law_1.01,2.531123161315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,8,power_law_1.01,3.568435287475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,8,power_law_1.01,4.180582427978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,8,power_law_1.01,5.110572814941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,8,power_law_1.01,5.881446456909179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,8,power_law_1.01,7.642316436767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,8,power_law_1.01,9.317171478271485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,2,power_law_1.2,0.054048001766204834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,2,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,2,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,2,power_law_1.2,0.20889599323272706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,2,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,2,power_law_1.2,0.37742080688476565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,2,power_law_1.2,0.4220928192138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,2,power_law_1.2,0.5519360065460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,8,power_law_1.01,12.255232238769532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,2,power_law_1.2,0.6062079906463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,2,power_law_1.2,0.557260799407959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,2,power_law_1.2,0.5908160209655762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,2,power_law_1.2,0.6827839851379395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,2,power_law_1.2,0.7065599918365478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,2,power_law_1.2,0.6914048194885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,2,power_law_1.2,0.7430143833160401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,2,power_law_1.2,0.7503871917724609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,2,power_law_1.2,0.8259584426879882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,2,power_law_1.2,0.9232255935668945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,2,power_law_1.2,1.0555392265319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,2,power_law_1.2,1.2386303901672364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,2,power_law_1.2,1.5335424423217774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,2,power_law_1.2,1.965260887145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,2,power_law_1.2,2.285772705078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,2,power_law_1.2,3.077734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,2,power_law_1.2,3.9796737670898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,2,power_law_1.2,5.972377777099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,2,power_law_1.2,7.280812835693359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,8,power_law_1.01,14.891827392578126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,8,power_law_1.01,22.16468505859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,8,power_law_1.01,26.600244140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,8,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,8,power_law_1.01,0.041356799006462094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,8,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,8,power_law_1.01,0.04337919950485229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,8,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,8,power_law_1.01,0.045459198951721194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,8,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,8,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,8,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,8,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,8,power_law_1.01,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,8,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,8,power_law_1.01,0.05548160076141358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,8,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,8,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,8,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,8,power_law_1.01,0.09154559969902039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,8,power_law_1.01,0.11857919692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,8,power_law_1.01,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,8,power_law_1.01,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,8,power_law_1.01,0.4487167835235596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,8,power_law_1.01,0.6627327919006347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,8,power_law_1.01,1.0659647941589356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,8,power_law_1.01,1.4501888275146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,16,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,16,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,16,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,16,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,16,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,16,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,16,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,16,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,16,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,16,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,16,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,16,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,16,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,16,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,16,power_law_1.2,0.051596802473068235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,16,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,16,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,16,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,16,power_law_1.2,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,16,power_law_1.2,0.10035200119018554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,16,power_law_1.2,0.12390400171279907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,16,power_law_1.2,0.20049281120300294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,16,power_law_1.2,0.2830336093902588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,16,power_law_1.2,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,16,power_law_1.2,0.5677055835723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,16,power_law_1.2,1.1333632469177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,16,power_law_1.2,1.4725119590759277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,8,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,8,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,8,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,8,balanced,0.0727040022611618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,8,balanced,0.2754559914271037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,8,balanced,0.5416959921518961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,8,balanced,0.5440853436787924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,8,balanced,0.5437440077463785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,8,balanced,0.5456000169118246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,8,balanced,0.5476693312327067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,8,balanced,0.5551520188649496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,8,balanced,0.560640017191569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,8,balanced,0.5638826688130697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,8,balanced,0.5666133165359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,8,balanced,0.5766826470692953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,8,balanced,0.5826559861501058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,8,balanced,0.5980159838994344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,8,balanced,0.6297599871953329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,8,balanced,0.667306661605835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,8,balanced,0.7031466960906982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,8,balanced,0.7749973138173422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,8,balanced,0.9263573487599691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,8,balanced,1.0910720030466716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,8,balanced,1.4540799458821614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,8,balanced,1.844223976135254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,8,balanced,2.5396906534830728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,8,balanced,3.1962238947550454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,16,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,16,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,16,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,16,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,16,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,16,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,16,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,16,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,16,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,16,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,16,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,16,balanced,0.05323199927806854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,16,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,16,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,16,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,16,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,16,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,16,balanced,0.07441066702206929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,16,balanced,0.08447999755541484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,16,balanced,0.18722132841746011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,16,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,16,balanced,0.34406399726867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,16,balanced,0.457045316696167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,16,balanced,0.6905173460642496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,16,balanced,0.9328640302022299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,16,balanced,1.4149972597757976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,16,balanced,1.9063466389973958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,8,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,8,power_law_1.2,0.055078399181365964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,8,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,8,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,8,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,8,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,8,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,8,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,8,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,8,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,8,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,8,power_law_1.2,0.06715520024299622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,8,power_law_1.2,0.06858879923820496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,8,power_law_1.2,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,8,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,8,power_law_1.2,0.08273280262947083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,8,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,8,power_law_1.2,0.15196160078048707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,8,power_law_1.2,0.2041856050491333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,8,power_law_1.2,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,8,power_law_1.2,0.3800895929336548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,8,power_law_1.2,0.6338560104370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,8,power_law_1.2,0.8599552154541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,8,power_law_1.2,1.3813759803771972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,8,power_law_1.2,1.743462371826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,1,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,1,balanced,0.2764799992243449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,1,balanced,0.5312853256861368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,1,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,1,balanced,0.5254826545715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,1,balanced,0.529578685760498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,1,balanced,0.5331626733144125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,1,balanced,0.5355519851048788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,1,balanced,0.5396480162938436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,1,balanced,0.5425493319829305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,1,balanced,0.5589333375295004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,1,balanced,0.566271980603536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,1,balanced,0.5737813313802084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,1,balanced,0.5790719985961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,1,balanced,0.571562647819519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,1,balanced,0.582314650217692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,8,power_law_1.2,2.5364479064941405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,1,balanced,0.6183253526687622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,1,balanced,0.6654293139775594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,1,balanced,0.7418879667917887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,1,balanced,0.9024853706359863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,1,balanced,1.160533348719279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,1,balanced,1.684991995493571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,1,balanced,2.2318080266316733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,1,balanced,3.351711908976237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,1,balanced,4.473685264587402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,1,balanced,6.585344314575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,1,balanced,8.7280642191569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,1,balanced,0.07167999943097432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,1,balanced,0.28074665864308673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,1,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,1,balanced,1.0332159996032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,1,balanced,2.0312746365865073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,1,balanced,4.029952049255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,1,balanced,4.04531192779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,1,balanced,4.065962791442871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,1,balanced,4.083029429117839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,1,balanced,4.101973215738933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,1,balanced,4.123818715413411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,1,balanced,4.151290575663249
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,1,balanced,4.176042556762695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,1,balanced,4.238165219624837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,1,balanced,4.28817081451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,1,balanced,4.343978563944499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,1,balanced,4.448767979939778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,8,power_law_1.2,3.6892673492431642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,1,balanced,4.737194697062175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,1,balanced,4.925098737080892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,1,balanced,5.331967989603679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,1,balanced,5.785770416259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,1,balanced,6.671530405680339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,1,balanced,7.65388298034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,1,balanced,9.845071792602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,1,balanced,11.588090260823568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,1,balanced,16.13465627034505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,1,balanced,19.568810780843098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,1,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,1,power_law_1.01,0.3004415988922119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,1,power_law_1.01,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,1,power_law_1.01,1.0217472076416017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,1,power_law_1.01,1.521459197998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,1,power_law_1.01,1.9781631469726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,1,power_law_1.01,2.879283142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,1,power_law_1.01,3.01342716217041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,1,power_law_1.01,3.097395133972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,1,power_law_1.01,3.215769577026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,1,power_law_1.01,3.3781761169433593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,1,power_law_1.01,3.384921646118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,1,power_law_1.01,3.505971145629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,1,power_law_1.01,3.5829631805419924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,1,power_law_1.01,3.7775360107421876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,1,power_law_1.01,3.751116943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,1,power_law_1.01,3.9294975280761717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,1,power_law_1.01,4.258816146850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,1,power_law_1.01,4.45030403137207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,1,power_law_1.01,4.838809585571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,1,power_law_1.01,5.327872085571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,1,power_law_1.01,5.967052841186524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,1,power_law_1.01,7.103488159179688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,1,power_law_1.01,9.077760314941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,1,power_law_1.01,10.398310089111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,1,power_law_1.01,14.425497436523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,1,power_law_1.01,17.509580993652342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,4,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,4,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,4,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,4,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,4,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,4,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,4,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,4,power_law_1.01,0.05915520191192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,4,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,4,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,4,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,4,power_law_1.01,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,4,power_law_1.01,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,4,power_law_1.01,0.12021759748458863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,4,power_law_1.01,0.1376255989074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,4,power_law_1.01,0.13864320516586304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,4,power_law_1.01,0.17428480386734008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,4,power_law_1.01,0.2371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,4,power_law_1.01,0.32563199996948244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,4,power_law_1.01,0.5095424175262451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,4,power_law_1.01,0.6082560062408447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,4,power_law_1.01,0.8626175880432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,4,power_law_1.01,1.127014446258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,4,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,4,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,4,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,4,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,4,power_law_1.2,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,4,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,4,power_law_1.2,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,4,power_law_1.2,0.21623680591583253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,4,power_law_1.2,0.16855039596557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,4,power_law_1.2,0.13864959478378297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,4,power_law_1.2,0.16138240098953247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,4,power_law_1.2,0.1820672035217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,4,power_law_1.2,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,4,power_law_1.2,0.21442561149597167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,4,power_law_1.2,0.23797760009765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,4,power_law_1.2,0.2604736089706421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,4,power_law_1.2,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,4,power_law_1.2,0.33239040374755857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,4,power_law_1.2,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,4,power_law_1.2,0.4640768051147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,4,power_law_1.2,0.5781504154205322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,4,power_law_1.2,0.8144895553588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,4,power_law_1.01,2.142585563659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,4,power_law_1.2,1.1255807876586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,4,power_law_1.2,1.8073600769042968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,4,power_law_1.2,2.598502349853516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,4,power_law_1.2,3.9223297119140623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,4,power_law_1.2,4.843110275268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,4,power_law_1.01,2.33492488861084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,4,power_law_1.01,3.852083206176758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,4,power_law_1.01,4.915609741210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,32,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,32,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,32,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,32,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,32,power_law_1.2,0.028460800647735596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,32,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,32,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,32,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,32,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,32,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,32,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,32,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,32,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,32,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,32,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,32,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,32,power_law_1.2,0.05384960174560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,32,power_law_1.2,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,32,power_law_1.2,0.0894976019859314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,32,power_law_1.2,0.11407359838485717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,32,power_law_1.2,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,32,power_law_1.2,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,32,power_law_1.2,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,32,power_law_1.2,0.45055999755859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,32,power_law_1.2,0.643071985244751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,32,power_law_1.2,1.0176511764526368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,32,power_law_1.2,1.3912063598632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,4,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,4,power_law_1.2,0.07799040079116822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,4,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,4,power_law_1.2,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,4,power_law_1.2,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,4,power_law_1.2,0.24944000244140624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,4,power_law_1.2,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,4,power_law_1.2,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,4,power_law_1.2,0.346726393699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,4,power_law_1.2,0.36126720905303955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,4,power_law_1.2,0.34611198902130125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,4,power_law_1.2,0.3446784019470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,4,power_law_1.2,0.35041279792785646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,4,power_law_1.2,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,4,power_law_1.2,0.3858432054519653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,4,power_law_1.2,0.4476928234100342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,4,power_law_1.2,0.4651008129119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,4,power_law_1.2,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,4,power_law_1.2,0.5750527858734131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,4,power_law_1.2,0.6688767910003662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,4,power_law_1.2,0.8015872001647949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,4,power_law_1.2,1.0112704277038573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,4,power_law_1.2,1.3682687759399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,4,power_law_1.2,1.9808256149291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,4,power_law_1.2,2.5145343780517577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,4,power_law_1.2,4.013670349121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,4,power_law_1.2,5.101158523559571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,32,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,32,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,32,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,32,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,32,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,32,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,32,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,32,balanced,0.029343999922275543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,32,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,32,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,32,balanced,0.03019733230272929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,32,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,32,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,32,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,32,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,32,balanced,0.03463999927043915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,32,balanced,0.0360000009338061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,32,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,32,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,32,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,32,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,32,balanced,0.09454933802286784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,32,balanced,0.20940800507863364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,32,balanced,0.3130026658376058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,32,balanced,0.40277334054311115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,32,balanced,0.6454613208770752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,32,balanced,0.8470186392466227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,4,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,4,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,4,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,4,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,4,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,4,power_law_1.01,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,4,power_law_1.01,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,4,power_law_1.01,0.1419263958930969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,4,power_law_1.01,0.17408000230789183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,4,power_law_1.01,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,4,power_law_1.01,0.17489919662475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,4,power_law_1.01,0.17694720029830932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,4,power_law_1.01,0.19906560182571412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,4,power_law_1.01,0.2258944034576416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,4,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,4,power_law_1.01,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,4,power_law_1.01,0.2762752056121826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,4,power_law_1.01,0.31969280242919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,4,power_law_1.01,0.369868803024292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,4,power_law_1.01,0.454860782623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,4,power_law_1.01,0.5447679996490479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,4,power_law_1.01,0.8202239990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,4,power_law_1.01,1.103872013092041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,4,power_law_1.01,1.6805696487426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,4,power_law_1.01,2.29171199798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,4,power_law_1.01,3.340902328491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,4,power_law_1.01,4.443750381469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,32,power_law_1.2,0.19025919437408448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,32,power_law_1.2,0.18882559537887572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,32,power_law_1.2,0.1892351984977722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,32,power_law_1.2,0.18922879695892333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,32,power_law_1.2,0.14540799856185913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,32,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,32,power_law_1.2,0.12062720060348511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,32,power_law_1.2,0.0894976019859314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,32,power_law_1.2,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,32,power_law_1.2,0.09154559969902039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,32,power_law_1.2,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,32,power_law_1.2,0.14069759845733643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,32,power_law_1.2,0.1482751965522766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,32,power_law_1.2,0.12390400171279907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,32,power_law_1.2,0.11079679727554322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,32,power_law_1.2,0.15849599838256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,32,power_law_1.2,0.18227200508117675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,32,power_law_1.2,0.2136064052581787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,32,power_law_1.2,0.18903039693832396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,32,power_law_1.2,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,32,power_law_1.2,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,32,power_law_1.2,0.4603903770446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,32,power_law_1.2,0.45199360847473147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,32,power_law_1.2,0.7442304134368897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,32,power_law_1.2,0.9175040245056152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,32,power_law_1.2,1.6168960571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,32,power_law_1.2,2.083225631713867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,2,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,2,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,2,power_law_1.01,0.08212479948997498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,2,power_law_1.01,0.12247040271759033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,2,power_law_1.01,0.19066879749298096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,2,power_law_1.01,0.313753604888916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,2,power_law_1.01,0.3282880067825317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,2,power_law_1.01,0.3506175994873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,2,power_law_1.01,0.369868803024292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,2,power_law_1.01,0.3708928108215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,2,power_law_1.01,0.39137279987335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,2,power_law_1.01,0.39813120365142823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,2,power_law_1.01,0.4055039882659912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,2,power_law_1.01,0.4228991985321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,2,power_law_1.01,0.44707841873168946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,2,power_law_1.01,0.46489601135253905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,2,power_law_1.01,0.5013504028320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,2,power_law_1.01,0.5816319942474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,2,power_law_1.01,0.6559743881225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,2,power_law_1.01,0.8841216087341308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,2,power_law_1.01,1.0944448471069337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,2,power_law_1.01,1.5249407768249512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,2,power_law_1.01,1.9746816635131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,2,power_law_1.01,2.934579277038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,2,power_law_1.01,4.0364032745361325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,2,power_law_1.01,5.702246475219726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,2,power_law_1.01,7.364198303222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,4,balanced,0.023365333676338196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,4,balanced,0.023717333873112995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,4,balanced,0.23244800170262656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,4,balanced,0.44356266657511395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,4,balanced,0.4517546494801839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,4,balanced,0.45293867588043213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,4,balanced,0.4500480095545451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,4,balanced,0.4514133135477702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,4,balanced,0.452949325243632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,4,balanced,0.4561866521835327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,4,balanced,0.4612853527069092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,4,balanced,0.46455466747283936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,4,balanced,0.46933333079020184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,4,balanced,0.48264535268147785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,4,balanced,0.48657067616780597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,4,balanced,0.49715201059977215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,4,balanced,0.48298664887746173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,4,balanced,0.5186560153961182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,4,balanced,0.5468159914016724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,4,balanced,0.5684906641642252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,4,balanced,0.6876160303751627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,4,balanced,0.719701369603475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,4,balanced,0.9210879802703857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,4,balanced,1.2118826707204182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,4,balanced,1.7976214090983074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,4,balanced,2.400767962137858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,128,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,128,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,128,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,128,power_law_1.01,0.04987519979476929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,128,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,128,power_law_1.01,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,128,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,128,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,128,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,128,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,128,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,128,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,128,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,128,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,128,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,128,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,128,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,128,power_law_1.01,0.0942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,128,power_law_1.01,0.11018240451812744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,128,power_law_1.01,0.22159359455108643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,128,power_law_1.01,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,128,power_law_1.01,0.41327362060546874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,128,power_law_1.01,0.587775993347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,128,power_law_1.01,0.8564672470092773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,128,power_law_1.01,1.2525568008422852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,128,power_law_1.01,1.8696191787719727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,128,power_law_1.01,2.4102848052978514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,4,power_law_1.2,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,4,power_law_1.2,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,4,power_law_1.2,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,4,power_law_1.2,0.6221824169158936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,4,power_law_1.2,0.8300543785095215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,4,power_law_1.2,1.1223039627075195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,4,power_law_1.2,1.2720128059387208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,4,power_law_1.2,1.2638208389282226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,4,power_law_1.2,1.2701696395874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,4,power_law_1.2,1.285529613494873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,4,power_law_1.2,1.2969984054565429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,4,power_law_1.2,1.3858816146850585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,4,power_law_1.2,1.3826047897338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,4,power_law_1.2,1.4254079818725587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,4,power_law_1.2,1.4645248413085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,4,power_law_1.2,1.4649344444274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,4,power_law_1.2,1.5781888008117675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,4,power_law_1.2,1.6361471176147462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,4,power_law_1.2,1.76312313079834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,4,power_law_1.2,1.9310272216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,4,power_law_1.2,2.2159360885620116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,4,power_law_1.2,2.8055551528930662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,4,power_law_1.2,2.912256050109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,4,power_law_1.2,4.1598976135253904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,4,power_law_1.2,5.445427322387696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,4,power_law_1.2,7.501414489746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,4,power_law_1.2,10.881843566894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,128,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,128,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,128,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,128,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,128,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,128,power_law_1.2,0.057734400033950806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,128,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,128,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,128,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,128,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,128,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,128,power_law_1.2,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,128,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,128,power_law_1.2,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,128,power_law_1.2,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,128,power_law_1.2,0.09502720236778259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,128,power_law_1.2,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,128,power_law_1.2,0.1937407970428467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,128,power_law_1.2,0.2742271900177002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,128,power_law_1.2,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,128,power_law_1.2,0.5216256141662597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,128,power_law_1.2,0.6895616054534912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,128,power_law_1.2,1.0160127639770509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,128,power_law_1.2,1.551974391937256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,128,power_law_1.2,2.3132160186767576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,128,power_law_1.2,3.4330623626708983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,128,power_law_1.2,4.640153503417968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,64,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,64,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,64,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,64,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,64,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,64,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,64,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,4,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,4,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,64,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,4,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,4,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,4,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,4,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,64,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,4,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,4,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,4,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,64,power_law_1.01,0.025785601139068602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,4,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,4,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,4,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,64,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,4,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,4,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,64,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,4,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,4,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,64,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,64,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,64,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,64,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,64,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,4,balanced,0.08157866696516673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,64,power_law_1.01,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,4,balanced,0.09130666653315227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,4,balanced,0.13141333063443503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,4,balanced,0.17151999473571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,64,power_law_1.01,0.10342400074005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,4,balanced,0.27938133478164673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,64,power_law_1.01,0.12472319602966309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,4,balanced,0.38229334354400635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,4,balanced,0.5800960063934326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,64,power_law_1.01,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,4,balanced,0.7905279795328776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,64,power_law_1.01,0.33239040374755857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,4,balanced,1.225215991338094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,64,power_law_1.01,0.4782080173492432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,4,balanced,1.6895999908447266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,64,power_law_1.01,0.6834176063537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,8,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,8,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,8,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,8,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,8,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,8,balanced,0.05919999877611796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,8,balanced,0.059706668059031166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,8,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,8,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,8,balanced,0.06073066592216492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,8,balanced,0.06177066763242086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,8,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,8,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,8,balanced,0.06534400085608165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,8,balanced,0.0682666649421056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,8,balanced,0.06929066777229309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,8,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,8,balanced,0.10291199882825215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,8,balanced,0.14267733693122864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,8,balanced,0.21998933951059976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,8,balanced,0.2783413330713908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,8,balanced,0.37666134039560956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,8,balanced,0.48622934023539227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,8,balanced,0.823637326558431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,8,balanced,1.1463680267333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,8,balanced,1.7346560160319011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,8,balanced,2.310826619466146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,16,power_law_1.01,0.5986303806304931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,16,power_law_1.01,0.7026688098907471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,16,power_law_1.01,0.6238207817077637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,16,power_law_1.01,0.6905856132507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,16,power_law_1.01,0.6070144176483154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,16,power_law_1.01,0.6426432132720947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,16,power_law_1.01,0.6592512130737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,16,power_law_1.01,0.7168000221252442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,16,power_law_1.01,0.6805439949035644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,16,power_law_1.01,0.6944767951965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,16,power_law_1.01,0.6846144199371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,16,power_law_1.01,0.7030784130096436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,16,power_law_1.01,0.6924287796020507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,16,power_law_1.01,0.735641622543335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,16,power_law_1.01,0.7647232055664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,16,power_law_1.01,0.7276544094085693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,16,power_law_1.01,0.7573376178741456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,16,power_law_1.01,0.8525823593139649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,16,power_law_1.01,0.8591360092163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,16,power_law_1.01,1.032595157623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,16,power_law_1.01,1.264025592803955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,16,power_law_1.01,1.529651165008545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,16,power_law_1.01,2.229452705383301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,16,power_law_1.01,2.97390079498291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,16,power_law_1.01,3.341299057006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,16,power_law_1.01,5.1757057189941404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,16,power_law_1.01,6.11409912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,4,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,4,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,4,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,4,balanced,0.24661332368850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,4,balanced,0.4580693244934082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,4,balanced,0.460970679918925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,4,balanced,0.4631893237431844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,4,balanced,0.46506667137145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,4,balanced,0.4940640131632487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,4,balanced,0.4684799909591675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,4,balanced,0.47274665037790936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,4,balanced,0.4776959816614787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,4,balanced,0.48110934098561603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,4,balanced,0.4828159809112549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,4,balanced,0.49237334728240967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,4,balanced,0.49885865052541095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,4,balanced,0.5178026755650839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,4,balanced,0.5468159914016724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,4,balanced,0.5698560078938802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,4,balanced,0.6212266683578491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,4,balanced,0.6758399804433187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,4,balanced,0.79257599512736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,4,balanced,0.9410560131072998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,4,balanced,1.268053372701009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,4,balanced,1.606485366821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,4,balanced,2.368170738220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,16,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,16,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,16,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,16,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,16,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,16,balanced,0.03497066597143809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,16,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,16,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,16,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,16,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,16,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,16,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,16,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,16,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,16,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,16,balanced,0.06673066814740498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,16,balanced,0.12032000223795573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,16,balanced,0.1962666710217794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,16,balanced,0.23091200987497965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,16,balanced,0.29320534070332843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,16,balanced,0.33740798632303876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,4,balanced,3.193514823913574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,16,balanced,0.4517546494801839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,16,balanced,0.5708800156911215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,16,balanced,0.920576016108195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,16,balanced,1.2180480162302654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,256,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,256,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,256,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,256,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,256,balanced,0.05204799771308899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,256,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,256,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,256,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,256,balanced,0.054602667689323425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,256,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,256,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,256,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,256,balanced,0.05782933533191681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,256,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,256,balanced,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,256,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,256,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,256,balanced,0.07423999905586243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,256,balanced,0.08171733220418294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,256,balanced,0.13942933082580566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,256,balanced,0.2367146611213684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,256,balanced,0.3193173408508301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,256,balanced,0.3959466616312663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,256,balanced,0.5553493499755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,256,balanced,0.7164586385091146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,256,balanced,1.0584746996561687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,256,balanced,1.4110719362894695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,8,power_law_1.2,0.566054391860962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,8,power_law_1.2,1.070899200439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,8,power_law_1.2,1.5538175582885743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,1,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,1,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,1,balanced,0.45293867588043213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,1,balanced,0.8867839972178141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,8,power_law_1.2,1.802841567993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,1,balanced,1.7421654065450032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,1,balanced,1.7517226537068684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,8,power_law_1.2,2.163302421569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,1,balanced,1.759061336517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,1,balanced,1.7658880551656086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,1,balanced,1.77510404586792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,8,power_law_1.2,2.716671943664551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,1,balanced,1.7824427286783855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,1,balanced,1.7996800740559895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,1,balanced,1.8216959635416667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,8,power_law_1.2,2.6060800552368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,1,balanced,1.8326187133789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,1,balanced,1.8691412607828777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,1,balanced,1.935530662536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,8,power_law_1.2,2.8389375686645506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,1,balanced,1.9642027219136555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,1,balanced,2.02837340037028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,8,power_law_1.2,2.446131134033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,1,balanced,2.610175927480062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,1,balanced,2.223957379659017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,8,power_law_1.2,2.2521791458129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,1,balanced,2.4511146545410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,1,balanced,2.674346605936686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,8,power_law_1.2,2.2562816619873045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,1,balanced,3.2414719263712564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,8,power_law_1.2,2.6206207275390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,1,balanced,3.760298728942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,8,power_law_1.2,2.405171203613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,1,balanced,4.928341229756673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,8,power_law_1.2,2.7531200408935548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,8,power_law_1.2,2.8008447647094727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,1,balanced,6.316202799479167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,8,power_law_1.2,2.637004852294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,1,balanced,9.169066747029623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,8,power_law_1.2,2.912870407104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,8,power_law_1.2,3.0031871795654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,8,power_law_1.2,3.176038360595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,1,balanced,11.944960276285807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,8,power_law_1.2,3.3249279022216798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,8,power_law_1.2,3.5604480743408202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,8,power_law_1.2,3.97127685546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,8,power_law_1.2,4.637081527709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,8,power_law_1.2,6.515711975097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,8,power_law_1.2,7.511859130859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,8,power_law_1.2,10.052812957763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,8,power_law_1.2,11.070054626464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.3842047929763794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.5380095958709716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.8857600212097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.8630208015441895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.9142271995544433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.9461759567260742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.9443327903747558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.9604991912841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,128,power_law_1.2,0.04935039877891541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.9762816429138184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.9912320137023926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.9803775787353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,1,power_law_1.2,1.033011245727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,128,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,1,power_law_1.2,1.123737621307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,128,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,128,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,1,power_law_1.2,1.1282431602478027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,128,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,128,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,1,power_law_1.2,1.2740608215332032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,128,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,128,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,128,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,1,power_law_1.2,1.428275203704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,128,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,128,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,128,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,128,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,128,power_law_1.2,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,128,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,128,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,128,power_law_1.2,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,128,power_law_1.2,0.11345920562744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,128,power_law_1.2,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,1,power_law_1.2,1.5861760139465333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,128,power_law_1.2,0.18288639783859253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,128,power_law_1.2,0.2623487949371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,128,power_law_1.2,0.4009984016418457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,1,power_law_1.2,1.8880512237548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,128,power_law_1.2,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,128,power_law_1.2,0.8200192451477051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,128,power_law_1.2,1.1593728065490723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,1,power_law_1.2,2.252595138549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,1,power_law_1.2,3.113574409484863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,128,power_law_1.2,1.9795967102050782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,8,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,8,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,8,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,8,balanced,0.5394773483276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,8,balanced,1.042944033940633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,8,balanced,2.0106239318847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,8,balanced,2.9916159311930337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,8,balanced,2.995370546976725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,8,balanced,3.000831921895345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,8,balanced,3.00492795308431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,8,balanced,3.070805231730143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,128,power_law_1.2,2.406809616088867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,8,balanced,3.081557273864746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,8,balanced,3.0912853876749673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,8,balanced,3.050138791402181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,8,balanced,3.0677334467569985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,8,balanced,3.081045468648275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,8,balanced,3.110912005106608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,8,balanced,3.1658665339152017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,8,balanced,3.217066764831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,8,balanced,3.31059201558431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,8,balanced,3.4036054611206055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,8,balanced,3.615546544392904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,8,balanced,3.827882766723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,8,balanced,4.207786560058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,8,balanced,4.528298695882161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,1,power_law_1.2,3.989913558959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,8,balanced,5.425834655761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,8,balanced,6.65070915222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,1,power_law_1.2,5.595750427246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,1,power_law_1.2,7.090380859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,8,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,8,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,8,power_law_1.01,0.0722815990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,1,power_law_1.2,10.480435180664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,8,power_law_1.01,0.0669376015663147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,8,power_law_1.01,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,8,power_law_1.01,0.11632640361785888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,8,power_law_1.01,0.16933759450912475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,8,power_law_1.01,0.19169280529022217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,8,power_law_1.01,0.15111680030822755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,8,power_law_1.01,0.1763327956199646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,8,power_law_1.01,0.1533951997756958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,8,power_law_1.01,0.14661120176315307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,8,power_law_1.01,0.15831040143966674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,8,power_law_1.01,0.1773568034172058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,8,power_law_1.01,0.20439040660858154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,8,power_law_1.01,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,8,power_law_1.01,0.2289664030075073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,8,power_law_1.01,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,8,power_law_1.01,0.2791424036026001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,8,power_law_1.01,0.3352576017379761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,8,power_law_1.01,0.38622078895568845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,8,power_law_1.01,0.6526976108551026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,8,power_law_1.01,0.8501184463500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,8,power_law_1.01,1.3600768089294433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,8,power_law_1.01,1.846067237854004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,8,power_law_1.01,2.631475257873535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,8,power_law_1.01,3.8203392028808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,4,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,4,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,4,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,4,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,4,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,4,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,4,power_law_1.2,0.10670080184936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,4,power_law_1.2,0.08622080087661743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,4,power_law_1.2,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,4,power_law_1.2,0.10219520330429077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,4,power_law_1.2,0.0886784017086029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,4,power_law_1.2,0.10342400074005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,4,power_law_1.2,0.15872000455856322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,4,power_law_1.2,0.15667200088500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,4,power_law_1.2,0.18821120262145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,4,power_law_1.2,0.19189759492874145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,4,power_law_1.2,0.20254719257354736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,4,power_law_1.2,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,4,power_law_1.2,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,4,power_law_1.2,0.31395840644836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,4,power_law_1.2,0.36229119300842283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,4,power_law_1.2,0.43683838844299316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,4,power_law_1.2,0.5490623950958252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,4,power_law_1.2,0.8347647666931153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,4,power_law_1.2,1.1409407615661622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,4,power_law_1.2,1.7897279739379883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,4,power_law_1.2,2.2024192810058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,32,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,32,balanced,0.0452106644709905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,32,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,32,balanced,0.2141546607017517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,32,balanced,0.30037333567937213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,32,balanced,0.3020799954732259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,32,balanced,0.30395734310150146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,32,balanced,0.30481066306432086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,32,balanced,0.3058346708615621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,32,balanced,0.3068586587905884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,32,balanced,0.3089066743850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,32,balanced,0.3136853377024333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,32,balanced,0.3160746693611145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,32,balanced,0.318122665087382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,32,balanced,0.3264853358268738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,32,balanced,0.3314346671104431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,32,balanced,0.34167468547821045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,32,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,32,balanced,0.381440003712972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,32,balanced,0.408405343691508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,32,balanced,0.45926400025685626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,32,balanced,0.5616639852523804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,32,balanced,0.5922133525212606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,32,balanced,0.725162665049235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,32,balanced,0.8965120315551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,32,balanced,1.3335893948872883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,32,balanced,1.7491626739501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,1,power_law_1.2,13.682278442382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,128,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,128,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,128,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,128,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,128,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,128,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,128,balanced,0.23381332556406656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,128,balanced,0.23586134115854898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,128,balanced,0.23705599705378214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,128,balanced,0.23808000485102335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,128,balanced,0.24081067244211832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,128,balanced,0.2445653279622396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,128,balanced,0.24661332368850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,128,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,128,balanced,0.25924267371495563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,128,balanced,0.26385066906611127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,4,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,128,balanced,0.27665066719055176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,128,balanced,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,128,balanced,0.3189493417739868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,128,balanced,0.36300798257191974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,128,balanced,0.4082346757253011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,128,balanced,0.4843519926071167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,128,balanced,0.5661013523737589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,4,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,4,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,4,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,128,balanced,0.7662933667500814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,4,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,4,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,4,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,4,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,4,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,4,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,128,balanced,0.9188693364461263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,4,balanced,0.056143999099731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,4,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,4,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,4,balanced,0.062122667829195656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,4,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,4,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,128,balanced,1.2895466486612956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,4,balanced,0.07355733215808868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,4,balanced,0.08703999718030293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,4,balanced,0.17902400096257529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,4,balanced,0.22561599810918173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,4,balanced,0.31163734197616577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,128,balanced,1.711616039276123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,4,balanced,0.40140799681345624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,4,balanced,0.6463146607081095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,4,balanced,0.9323519865671793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,4,balanced,1.5063039461771648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,4,balanced,2.0727465947469077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,8,power_law_1.2,0.02802560031414032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,8,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,8,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,8,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,8,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,8,power_law_1.2,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,8,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,8,power_law_1.2,0.036236798763275145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,8,power_law_1.2,0.039289599657058714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,8,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,8,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,8,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,8,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,8,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,8,power_law_1.2,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,8,power_law_1.2,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,8,power_law_1.2,0.1689471960067749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,8,power_law_1.2,0.19824639558792115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,8,power_law_1.2,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,8,power_law_1.2,0.313753604888916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,8,power_law_1.2,0.6039552211761474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,8,power_law_1.2,0.5957632064819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,8,power_law_1.2,1.1290623664855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,8,power_law_1.2,1.5714303970336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,16,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,16,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,16,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,16,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,16,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,16,balanced,0.19011199474334717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,16,balanced,0.1909760038057963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,16,balanced,0.21452800432840982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,16,balanced,0.19234132766723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,16,balanced,0.1925119956334432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,16,balanced,0.19404800732930502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,16,balanced,0.19541333119074503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,16,balanced,0.1960960030555725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,16,balanced,0.1976319948832194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,16,balanced,0.20104533433914185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,16,balanced,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,16,balanced,0.2070186734199524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,16,balanced,0.21760000785191855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,16,balanced,0.22715733448664346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,16,balanced,0.24302933613459268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,16,balanced,0.253440002600352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,16,balanced,0.29764266808827716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,16,balanced,0.3206826647122701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,16,balanced,0.40243200461069745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,16,balanced,0.44680531819661456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,16,balanced,0.6946132977803549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,16,balanced,0.9316693147023519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,64,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,64,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,64,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,64,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,64,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,64,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,64,power_law_1.2,0.03214080035686493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,64,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,64,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,64,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,64,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,64,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,64,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,64,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,64,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,64,power_law_1.2,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,64,power_law_1.2,0.12984319925308227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,64,power_law_1.2,0.16814080476760865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,64,power_law_1.2,0.2504703998565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,64,power_law_1.2,0.4143104076385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,64,power_law_1.2,0.6684671878814697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,64,power_law_1.2,0.9656319618225098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,64,power_law_1.2,1.3729791641235352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,4,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,4,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,4,balanced,0.03855466594298681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,4,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,4,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,4,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,4,balanced,0.044026667873064675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,4,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,4,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,4,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,4,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,4,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,4,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,4,balanced,0.07797866563002269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,4,balanced,0.08071466783682506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,4,balanced,0.09454933802286784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,4,balanced,0.1109333336353302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,4,balanced,0.13482667009035745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,4,balanced,0.2404586672782898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,4,balanced,0.2884053389231364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,4,balanced,0.429909348487854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,4,balanced,0.5420053402582804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,4,balanced,0.8970239957173666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,4,balanced,1.223680019378662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,4,balanced,1.7940479914347331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,4,balanced,2.4000746409098306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,1,power_law_1.01,1.064748764038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,1,power_law_1.01,2.0885503768920897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,1,power_law_1.01,4.033945465087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,1,power_law_1.01,7.998668670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,64,power_law_1.2,1.7971200942993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,1,power_law_1.01,14.418124389648437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,1,power_law_1.01,20.98462677001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,1,power_law_1.01,24.596275329589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,1,power_law_1.01,31.672933959960936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,1,power_law_1.01,32.46940307617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,1,power_law_1.01,34.19195556640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,1,power_law_1.01,34.93232727050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,1,power_law_1.01,36.61226806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,1,power_law_1.01,37.1736572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,1,power_law_1.01,39.070925903320315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,1,power_law_1.01,39.26384582519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.3053567886352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.4782080173492432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.6270976066589355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,1,power_law_1.2,1.1063296318054199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,1,power_law_1.2,1.191321563720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,1,power_law_1.2,1.2621824264526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,1,power_law_1.2,1.2824576377868653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,1,power_law_1.2,1.3551615715026855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,1,power_law_1.01,40.67164306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,1,power_law_1.2,1.358016014099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,1,power_law_1.2,1.4256128311157226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,1,power_law_1.2,1.4520319938659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,1,power_law_1.2,1.507091236114502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,1,power_law_1.2,1.5730496406555177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,1,power_law_1.2,1.6021503448486327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,1,power_law_1.2,1.6785408020019532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,1,power_law_1.2,1.8374656677246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,1,power_law_1.2,2.047385597229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,1,power_law_1.2,2.4215551376342774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,1,power_law_1.2,2.7834367752075195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,1,power_law_1.2,3.6075519561767577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,1,power_law_1.2,4.315750503540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,1,power_law_1.01,42.91502075195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,1,power_law_1.2,6.081126403808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,1,power_law_1.2,7.660543823242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,1,power_law_1.01,47.03846435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,1,power_law_1.2,11.025408172607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,16,power_law_1.01,0.039110401272773744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,16,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,16,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,16,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,16,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,16,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,16,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,16,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,16,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,16,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,16,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,16,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,16,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,1,power_law_1.01,46.15679931640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,16,power_law_1.01,0.04647679924964905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,16,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,16,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,16,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,16,power_law_1.01,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,16,power_law_1.01,0.0886784017086029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,16,power_law_1.01,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,16,power_law_1.01,0.18534400463104247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,16,power_law_1.01,0.2521087884902954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,16,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,16,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,16,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,16,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,16,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,16,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,16,power_law_1.01,0.5148672103881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,16,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,16,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,16,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,16,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,16,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,16,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,16,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,16,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,16,power_law_1.01,0.8366080284118652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,16,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,16,balanced,0.04573333263397217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,16,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,16,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,16,balanced,0.05973333120346069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,16,balanced,0.07202133536338806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,16,balanced,0.0846506655216217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,16,power_law_1.01,1.0971136093139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,16,balanced,0.11315199732780457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,16,balanced,0.2198186715443929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,16,balanced,0.31726932525634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,16,balanced,0.40908801555633545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,16,balanced,0.6275413433710734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,16,balanced,0.8780799706776937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,1,power_law_1.01,49.82987670898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,2,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,2,power_law_1.01,0.02640640139579773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,2,power_law_1.01,0.026617598533630372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,2,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,2,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,1,power_law_1.2,14.340301513671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,2,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,2,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,2,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,2,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,2,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,2,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,2,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,2,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,2,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,2,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,2,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,2,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,2,power_law_1.01,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,1,power_law_1.01,53.86997680664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,8,power_law_1.2,0.18862080574035645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,8,power_law_1.2,0.35143680572509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,8,power_law_1.2,0.3792896032333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,8,power_law_1.2,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,8,power_law_1.2,0.5482495784759521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,8,power_law_1.2,0.5914624214172364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,2,power_law_1.01,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,8,power_law_1.2,0.572211217880249
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,8,power_law_1.2,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,8,power_law_1.2,0.5931007862091064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,2,power_law_1.01,0.130457603931427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,8,power_law_1.2,0.618291187286377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,8,power_law_1.2,0.5941247940063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,8,power_law_1.2,0.6090752124786377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,8,power_law_1.2,0.6190976142883301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,8,power_law_1.2,0.6334464073181152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,2,power_law_1.01,0.1482751965522766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,8,power_law_1.2,0.6905856132507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,8,power_law_1.2,0.6672383785247803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,2,power_law_1.01,0.30208001136779783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,8,power_law_1.2,0.6871039867401123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,8,power_law_1.2,0.7176191806793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,8,power_law_1.2,0.758784008026123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,8,power_law_1.2,0.7989247798919678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,8,power_law_1.2,0.9220095634460449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,8,power_law_1.2,1.1266048431396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,8,power_law_1.2,1.3645824432373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,8,power_law_1.2,1.8544639587402343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,8,power_law_1.2,2.081177520751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,8,power_law_1.2,2.841600036621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,1,power_law_1.01,59.42393188476562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,8,power_law_1.2,3.486310577392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,2,power_law_1.01,0.3999743938446045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,2,power_law_1.01,0.6400000095367432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,1,power_law_1.01,62.483453369140626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,2,power_law_1.01,0.8687616348266601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,1,power_law_1.01,74.79603271484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,2,power_law_1.01,1.236780834197998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,1,power_law_1.01,85.22076416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,1,power_law_1.01,101.2684814453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,2,power_law_1.01,2.02608642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,1,power_law_1.01,102.9056884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,1,power_law_1.2,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,1,power_law_1.2,0.6776832103729248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,1,power_law_1.2,1.3008895874023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,1,power_law_1.2,2.3353343963623048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,1,power_law_1.2,3.5251903533935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,1,power_law_1.2,4.539174270629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,1,power_law_1.2,7.017266845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,1,power_law_1.2,7.409241485595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,1,power_law_1.2,7.87066879272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,1,power_law_1.2,7.823359680175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,1,power_law_1.2,8.307917022705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,1,power_law_1.2,8.473804473876953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,1,power_law_1.2,8.902041625976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,1,power_law_1.2,9.149644470214843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,1,power_law_1.2,9.29278106689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,1,power_law_1.2,9.68089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,1,power_law_1.2,9.866854095458985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,1,power_law_1.2,10.280550384521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,16,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,16,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,16,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,16,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,16,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,16,power_law_1.2,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,16,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,16,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,16,power_law_1.2,0.03643519878387451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,1,power_law_1.2,10.668646240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,16,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,16,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,16,power_law_1.2,0.04687359929084778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,16,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,16,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,16,power_law_1.2,0.07639039754867553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,16,power_law_1.2,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,16,power_law_1.2,0.117740797996521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,16,power_law_1.2,0.18247679471969605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,16,power_law_1.2,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,1,power_law_1.2,10.996530914306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,16,power_law_1.2,0.3096575975418091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,16,power_law_1.2,0.4016128063201904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,16,power_law_1.2,0.5681151866912841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,1,power_law_1.2,11.681177520751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,16,power_law_1.2,0.7571455955505371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,1,power_law_1.2,13.24523468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,16,power_law_1.2,1.2547967910766602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.32030720710754396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.5496831893920898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,1,power_law_1.01,1.0522624015808106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,16,power_law_1.2,1.688140869140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,1,power_law_1.01,2.029567909240723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,1,power_law_1.2,14.9225341796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,1,power_law_1.01,3.666944122314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,1,power_law_1.01,5.15153923034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,1,power_law_1.01,6.0637054443359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,1,power_law_1.2,18.757221984863282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,1,power_law_1.01,7.936614227294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,1,power_law_1.01,8.370995330810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,1,power_law_1.2,19.100262451171876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,4,power_law_1.2,1.0610688209533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,4,power_law_1.2,2.013382339477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,1,power_law_1.01,8.71014404296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,4,power_law_1.2,2.3293888092041017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,4,power_law_1.2,3.2489471435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,1,power_law_1.01,8.84326400756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,4,power_law_1.2,3.941580963134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,4,power_law_1.2,4.918067169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,1,power_law_1.01,9.422233581542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,1,power_law_1.2,24.96942138671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,4,power_law_1.2,6.475775909423828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,1,power_law_1.01,9.545728302001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,4,power_law_1.2,6.0493824005126955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,4,power_law_1.2,6.836224365234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,1,power_law_1.01,9.791487884521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,16,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,16,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,16,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,16,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,16,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,16,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,16,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,16,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,16,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,16,balanced,0.03600533306598663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,16,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,16,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,16,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,16,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,4,power_law_1.2,6.790962982177734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,16,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,16,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,16,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,16,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,16,balanced,0.11724799871444702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,16,balanced,0.15479466319084167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,16,balanced,0.24388267596562704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,1,power_law_1.2,29.684121704101564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,16,balanced,0.2525866627693176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,16,balanced,0.37614933649698895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,1,power_law_1.01,10.119776153564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,16,balanced,0.46779731909434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,4,power_law_1.2,6.699622344970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,16,balanced,0.7621973355611166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,16,balanced,1.0164906978607178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,4,power_law_1.2,6.794445037841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,1,power_law_1.01,10.52938232421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,4,power_law_1.2,6.902988433837891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,1,power_law_1.01,10.791731262207032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,4,power_law_1.2,7.249305725097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,4,power_law_1.2,7.567974090576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,1,power_law_1.01,11.46982421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,4,power_law_1.2,7.973887634277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,1,power_law_1.01,12.105522918701173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,4,power_law_1.2,8.396390533447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,1,power_law_1.01,13.031423950195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,4,power_law_1.2,8.843878173828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,4,power_law_1.2,9.061376190185547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,1,power_law_1.01,13.567385864257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,4,power_law_1.2,9.702400207519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,1,power_law_1.01,15.077171325683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,4,power_law_1.2,10.122637176513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,4,power_law_1.2,11.083776092529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,1,power_law_1.01,15.860121154785157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,4,power_law_1.2,12.538470458984374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,1,power_law_1.01,18.744114685058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,8,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,8,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,8,power_law_1.2,0.19107840061187745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,8,power_law_1.2,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,8,power_law_1.2,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,4,power_law_1.2,15.584870910644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,8,power_law_1.2,0.2125823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,8,power_law_1.2,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,8,power_law_1.2,0.22425599098205568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,8,power_law_1.2,0.22671360969543458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,8,power_law_1.2,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,8,power_law_1.2,0.23470079898834229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,8,power_law_1.2,0.2357248067855835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,8,power_law_1.2,0.24842240810394287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,1,power_law_1.01,21.694668579101563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,8,power_law_1.2,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,8,power_law_1.2,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,8,power_law_1.2,0.2549760103225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,4,power_law_1.2,17.440357971191407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,8,power_law_1.2,0.2742271900177002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,8,power_law_1.2,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,8,power_law_1.2,0.3493824005126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,8,power_law_1.2,0.3794944047927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,8,power_law_1.2,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,4,power_law_1.2,24.554899597167967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,1,power_law_1.01,29.372824096679686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,8,power_law_1.2,0.6662144184112548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,8,power_law_1.2,0.8249343872070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,1,power_law_1.01,31.5641845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,4,power_law_1.2,34.62675170898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,8,power_law_1.2,1.1429887771606446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,8,power_law_1.2,1.8384895324707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,8,power_law_1.2,2.392473602294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,64,power_law_1.01,0.6039552211761474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,64,power_law_1.01,0.5543935775756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,64,power_law_1.01,0.5552127838134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,64,power_law_1.01,0.5556223869323731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,64,power_law_1.01,0.4554751873016357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,64,power_law_1.01,0.522649621963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,64,power_law_1.01,0.5527552127838135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,64,power_law_1.01,0.5453824043273926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,64,power_law_1.01,0.5468160152435303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,64,power_law_1.01,0.5375999927520752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,64,power_law_1.01,0.5371903896331787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,64,power_law_1.01,0.5548031806945801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,64,power_law_1.01,0.5246975898742676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,64,power_law_1.01,0.5646336078643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,64,power_law_1.01,0.5574656009674073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,64,power_law_1.01,0.5971583843231201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,64,power_law_1.01,0.5892096042633057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,64,power_law_1.01,0.595136022567749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,64,power_law_1.01,0.6684671878814697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,64,power_law_1.01,0.7858176231384277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,64,power_law_1.01,0.9723648071289063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,64,power_law_1.01,1.3205504417419434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,64,power_law_1.01,1.3645824432373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,64,power_law_1.01,1.8704383850097657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,64,power_law_1.01,2.5028608322143553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,64,power_law_1.01,3.396198272705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,64,power_law_1.01,4.192460632324218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,4,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,4,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,4,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,4,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,4,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,4,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,4,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,4,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,4,balanced,0.033439998825391136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,4,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,4,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,4,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,4,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,4,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,4,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,4,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,4,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,4,balanced,0.07611733178297679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,4,balanced,0.08789333701133728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,4,balanced,0.1353386640548706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,4,balanced,0.22033067544301352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,4,balanced,0.3466240167617798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,4,balanced,0.4374186595280965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,4,balanced,0.6775466601053873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,4,balanced,0.9400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,4,balanced,1.444170633951823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,4,balanced,1.9473066329956055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,8,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,8,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,8,power_law_1.2,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,8,power_law_1.2,0.06653439998626709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,8,power_law_1.2,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,8,power_law_1.2,0.10772479772567749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,8,power_law_1.2,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,8,power_law_1.2,0.11772160530090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,8,power_law_1.2,0.15749119520187377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,8,power_law_1.2,0.18903039693832396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,8,power_law_1.2,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,8,power_law_1.2,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,8,power_law_1.2,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,8,power_law_1.2,0.20787200927734376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,8,power_law_1.2,0.24289278984069823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,8,power_law_1.2,0.232857608795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,8,power_law_1.2,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,8,power_law_1.2,0.3057663917541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,8,power_law_1.2,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,8,power_law_1.2,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,8,power_law_1.2,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,8,power_law_1.2,0.5890048027038575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,8,power_law_1.2,0.8449919700622559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,8,power_law_1.2,1.4270463943481446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,8,power_law_1.2,1.831110382080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,8,power_law_1.01,0.23941121101379395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,8,power_law_1.01,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,8,power_law_1.01,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,8,power_law_1.01,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,8,power_law_1.01,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,8,power_law_1.01,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,8,power_law_1.01,0.24944639205932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,8,power_law_1.01,0.25207040309906004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,8,power_law_1.01,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,8,power_law_1.01,0.2711551904678345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,8,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,8,power_law_1.01,0.33280000686645506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,8,power_law_1.01,0.3788800001144409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,8,power_law_1.2,2.988627243041992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,8,power_law_1.01,0.3516416072845459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,8,power_law_1.01,0.3960832118988037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,1,power_law_1.2,0.050361597537994386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,8,power_law_1.01,0.4976640224456787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,1,power_law_1.2,0.23797760009765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,1,power_law_1.2,0.4310719966888428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,8,power_law_1.01,0.5805952072143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,1,power_law_1.2,0.5974016189575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,1,power_law_1.2,0.7944191932678223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,1,power_law_1.2,1.47128324508667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,8,power_law_1.01,0.7663424015045166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,1,power_law_1.2,1.5286272048950196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,1,power_law_1.2,1.6107519149780274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,1,power_law_1.2,1.6664575576782226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,8,power_law_1.01,0.9687040328979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,1,power_law_1.2,1.656825637817383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,1,power_law_1.2,1.7313791275024415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,1,power_law_1.2,1.7313472747802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,1,power_law_1.2,1.759846305847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,1,power_law_1.2,1.8300928115844726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,8,power_law_1.01,1.3811712265014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,1,power_law_1.2,1.8581504821777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,1,power_law_1.2,1.886195182800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,1,power_law_1.2,1.9296255111694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,1,power_law_1.2,2.059878349304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,8,power_law_1.2,3.457843017578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,1,power_law_1.2,2.1590015411376955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,1,power_law_1.2,2.428108787536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,8,power_law_1.01,1.6574464797973634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,1,power_law_1.2,2.762931251525879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,1,power_law_1.2,3.370188903808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,8,power_law_1.01,2.243174362182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,1,power_law_1.2,4.097024154663086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,8,power_law_1.01,3.1879167556762695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,1,power_law_1.2,5.339750289916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,8,power_law_1.01,4.628684616088867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,4,balanced,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,4,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,4,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,4,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,4,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,4,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,4,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,4,balanced,0.03685333331425985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,4,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,4,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,4,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,4,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,4,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,4,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,4,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,4,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,4,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,4,balanced,0.06843733290831248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,4,balanced,0.07594666878382365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,4,balanced,0.18568533658981323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,4,balanced,0.2244266668955485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,4,balanced,0.27357866366704303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,4,balanced,0.31197333335876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,4,balanced,0.4217173258463542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,4,balanced,0.5471573273340861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,4,balanced,0.8963306744893392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,4,balanced,1.2431360085805256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,1,power_law_1.2,6.236979293823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,8,power_law_1.01,6.147686386108399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,8,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,8,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,8,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,8,balanced,0.2362026572227478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,8,balanced,0.45158398151397705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,8,balanced,0.45448533693949383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,8,balanced,0.45585068066914874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,8,balanced,0.45772798856099445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,8,balanced,0.45875199635823566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,8,balanced,0.4601173400878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,8,balanced,0.46301865577697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,8,balanced,0.46745598316192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,8,balanced,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,8,balanced,0.4746239980061849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,8,balanced,0.48366932074228924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,8,balanced,0.48793598016103107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,8,balanced,0.497322678565979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,8,balanced,0.5179733435312907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,8,balanced,0.5249706506729126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,8,power_law_1.01,8.518656158447266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,8,balanced,0.5730986595153809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,8,balanced,0.5886293252309164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,8,balanced,0.6710613568623861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,8,balanced,0.7662933667500814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,8,balanced,1.0079572995503743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,8,balanced,1.274880011876424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,8,balanced,1.90993070602417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,8,balanced,2.5031679471333823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,1,power_law_1.2,8.83609619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,4,power_law_1.2,0.2727936029434204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,4,power_law_1.2,0.4247551918029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,4,power_law_1.2,0.37212159633636477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,4,power_law_1.2,0.4642816066741943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,4,power_law_1.2,0.4655104160308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,4,power_law_1.2,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,4,power_law_1.2,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,4,power_law_1.2,0.4777984142303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,4,power_law_1.2,0.5363711833953857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,4,power_law_1.2,0.5038080215454102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,4,power_law_1.2,0.5478400230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,4,power_law_1.2,0.597811222076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,4,power_law_1.2,0.6436863899230957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,4,power_law_1.2,0.7081984043121338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,4,power_law_1.2,0.7589888095855712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,4,power_law_1.2,0.830668830871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,4,power_law_1.2,0.8876031875610352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,4,power_law_1.2,1.0786815643310548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,4,power_law_1.2,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,4,power_law_1.2,1.7653696060180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,4,power_law_1.2,2.392678451538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,1,balanced,0.0628053347269694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,1,balanced,0.06843199829260509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,1,balanced,0.0890880028406779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,1,balanced,0.2797226707140605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,1,balanced,0.5319679975509644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,1,balanced,1.0294613043467205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,1,balanced,1.0402080217997234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,1,balanced,1.0466986497243245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,1,balanced,1.0582773685455322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,8,power_law_1.01,11.215245056152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,1,balanced,1.0673226515452068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,1,balanced,1.088853359222412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,1,balanced,1.1101653575897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,1,balanced,1.1287840207417805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,1,balanced,1.1712799866994221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,1,balanced,1.223680019378662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,1,balanced,1.2615679899851482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,1,balanced,1.354922612508138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,1,balanced,1.5767626762390137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,1,balanced,1.7829546928405762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,1,balanced,2.1700266202290854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,1,balanced,2.603520075480143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,1,balanced,3.5314133961995444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,1,balanced,4.457098642985026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,4,power_law_1.2,3.01977596282959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,1,balanced,6.309546788533528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,1,balanced,8.135679880777994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,1,balanced,11.830101013183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,1,balanced,15.434752146402994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,1,power_law_1.2,11.431321716308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,4,power_law_1.2,3.871744155883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,4,power_law_1.2,7.17496337890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,4,power_law_1.2,8.199372863769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,4,balanced,0.22646933794021606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,4,balanced,0.4210346539815267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,4,balanced,0.7927467028299967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,4,balanced,1.5506772994995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,4,balanced,2.9009920756022134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,4,balanced,4.078421274820964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,4,balanced,4.092927932739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,4,balanced,4.056405385335286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,4,balanced,4.072106679280599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,4,balanced,4.08405335744222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,4,balanced,4.108288129170735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,4,balanced,4.128938674926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,4,balanced,4.149759928385417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,4,balanced,4.187477429707845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,4,balanced,4.22109858194987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,4,balanced,4.248746554056804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,4,balanced,4.313088099161784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,4,balanced,4.441770553588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,4,balanced,4.600831985473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,4,balanced,4.842837333679199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,4,balanced,4.959402720133464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,4,balanced,5.312170664469401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,4,balanced,5.6371199289957685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,4,balanced,7.057749430338542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,4,balanced,7.83359972635905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,4,balanced,12.034384409586588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,4,balanced,13.417301177978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,4,power_law_1.2,11.192320251464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,16,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,16,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,16,power_law_1.2,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,16,power_law_1.2,0.21524479389190673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,16,power_law_1.2,0.20541439056396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,16,power_law_1.2,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,16,power_law_1.2,0.11571199893951416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,16,power_law_1.2,0.17059839963912965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,16,power_law_1.2,0.18063360452651978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,16,power_law_1.2,0.1112064003944397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,16,power_law_1.2,0.1411072015762329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,16,power_law_1.2,0.1773568034172058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,16,power_law_1.2,0.16997120380401612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,16,power_law_1.2,0.19578880071640015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,16,power_law_1.2,0.18165760040283202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,16,power_law_1.2,0.21524479389190673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,16,power_law_1.2,0.22527999877929689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,16,power_law_1.2,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,16,power_law_1.2,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,16,power_law_1.2,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,16,power_law_1.2,0.3663872003555298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,16,power_law_1.2,0.5183487892150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,16,power_law_1.2,0.6764544010162353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,16,power_law_1.2,1.225932788848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,16,power_law_1.2,1.5108096122741699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,16,power_law_1.2,2.5337856292724608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,16,power_law_1.2,3.199385643005371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,8,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,8,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,8,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,8,balanced,0.1621333360671997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,8,balanced,0.3500373363494873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,8,balanced,0.6761813163757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,8,balanced,0.7033173243204752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,8,balanced,0.6702079772949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,8,balanced,0.6720853646596273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,8,balanced,0.6737919648488363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,8,balanced,0.6782293319702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,8,balanced,0.6818133195241293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,8,balanced,0.6841973463694254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,8,balanced,0.6896639664967855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,8,balanced,0.6971733570098877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,8,balanced,0.702122688293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,8,balanced,0.7145813306172689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,8,balanced,0.7427413463592529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,8,balanced,0.7613440354665121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,8,balanced,0.7543360392252604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,8,balanced,0.803663969039917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,8,balanced,0.881493330001831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,8,balanced,0.9485653241475424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,8,balanced,1.1246933142344158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,8,balanced,1.2677120367685955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,8,balanced,1.6597332954406738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,8,balanced,2.092202663421631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,64,balanced,0.02199466774861018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,64,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,64,balanced,0.021829334398110706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,64,balanced,0.02199999988079071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,64,balanced,0.022495999932289124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,64,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,64,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,64,balanced,0.023546665906906128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,64,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,64,balanced,0.023711999257405598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,64,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,64,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,64,balanced,0.024714666108290356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,64,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,64,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,64,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,64,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,64,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,64,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,64,balanced,0.05136000116666158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,64,balanced,0.07048533360163371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,64,balanced,0.13567999998728433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,64,balanced,0.274944007396698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,64,balanced,0.37768534819285077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,128,balanced,0.020821332931518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,128,balanced,0.020309332758188248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,128,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,128,balanced,0.020303999384244282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,128,balanced,0.02065066620707512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,128,balanced,0.021333334346612293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,128,balanced,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,128,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,128,balanced,0.022181332111358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,128,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,128,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,128,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,128,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,128,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,128,balanced,0.0283146674434344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,128,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,128,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,128,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,128,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,128,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,128,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,128,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,128,balanced,0.049471999208132424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,128,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,128,balanced,0.10308266679445903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,128,balanced,0.1599146624406179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,4,power_law_1.2,17.476608276367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,64,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,64,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,64,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,64,balanced,0.044346665342648826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,64,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,64,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,64,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,64,balanced,0.0525546669960022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,64,balanced,0.05373333394527435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,64,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,64,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,64,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,64,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,64,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,64,balanced,0.09250133236249287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,64,balanced,0.12390399972597758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,64,balanced,0.16793600718180338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,64,balanced,0.21248000860214233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,64,balanced,0.2302239934603373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,64,balanced,0.27187200387318927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,64,balanced,0.3155626654624939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,64,balanced,0.3862186670303345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,64,balanced,0.46882132689158124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,64,balanced,0.6543360153834025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,64,balanced,0.8152746359507242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,64,balanced,1.1983946959177654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,64,balanced,1.5634560585021973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,2,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,2,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,2,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,2,balanced,0.041109333435694374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,2,balanced,0.04145599901676178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,2,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,2,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,2,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,2,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,2,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,2,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,2,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,2,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,2,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,2,balanced,0.07577600081761678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,2,balanced,0.07765333354473114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,2,balanced,0.0955466628074646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,2,balanced,0.11588266491889954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,2,balanced,0.17698132991790771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,2,balanced,0.2539520064989726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,2,balanced,0.30957333246866864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,2,balanced,0.47786664962768555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,2,balanced,0.6869333585103353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,2,balanced,1.0900479952494304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,2,balanced,1.4881812731424968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,2,balanced,2.2005759874979653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,2,balanced,2.9564587275187173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,2,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,2,balanced,0.04897066454092661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,2,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,2,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,2,balanced,0.08362666765848796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,2,balanced,0.2983253399531047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,2,balanced,0.3022506634394328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,2,balanced,0.29334932565689087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,2,balanced,0.3130026658376058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,2,balanced,0.30292266607284546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,2,balanced,0.3092479904492696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,2,balanced,0.3201706608136495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,2,balanced,0.32614399989446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,2,balanced,0.3403093417485555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,2,balanced,0.3771573305130005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,2,balanced,0.3696639935175578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,2,balanced,0.3957759936650594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,2,balanced,0.45260798931121826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,2,balanced,0.5278720060984293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,2,balanced,0.7024640242258707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,2,balanced,0.8937813440958658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,2,balanced,1.2701013088226318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,2,balanced,1.6829439798990886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,2,balanced,2.4789172808329263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,2,balanced,3.3249279657999673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,2,balanced,5.02510929107666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,2,balanced,6.62118403116862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,16,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,16,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,16,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,16,balanced,0.2853546738624573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,16,balanced,0.5492053429285685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,16,balanced,1.0548906326293945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,16,balanced,1.561087926228841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,16,balanced,1.5397547086079915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,16,balanced,1.5419732729593914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,16,balanced,1.5725226402282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,16,balanced,1.5438507397969563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,16,balanced,1.5508480072021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,16,balanced,1.5520426432291667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,16,balanced,1.5617705980936687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,16,balanced,1.5716692606608074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,16,balanced,1.5749120712280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,16,balanced,1.5938560167948406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,16,balanced,1.6295253435770671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,16,balanced,1.6776533126831055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,4,power_law_1.01,0.20828158855438234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,16,balanced,1.7338026364644368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,4,power_law_1.01,0.35573759078979494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,16,balanced,1.7855146725972493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,4,power_law_1.01,0.4671487808227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,16,balanced,1.8781812985738118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,4,power_law_1.01,0.6172671794891358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,4,power_law_1.01,0.7391232013702392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,4,power_law_1.01,0.842956829071045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,4,power_law_1.01,1.174732780456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,16,balanced,2.054138660430908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,4,power_law_1.01,1.0108799934387207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,16,balanced,2.2302719751993814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,4,power_law_1.01,1.1997183799743651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,4,power_law_1.01,1.095680046081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,16,balanced,2.409301280975342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,4,power_law_1.01,1.2011520385742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,16,balanced,3.017727851867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,4,power_law_1.01,1.1370495796203612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,4,power_law_1.01,1.1960320472717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,16,balanced,3.5631786982218423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,4,power_law_1.01,1.2333056449890136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,4,power_law_1.01,1.2312576293945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,4,power_law_1.01,1.2926976203918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,4,power_law_1.01,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,4,power_law_1.01,1.3170687675476074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,4,power_law_1.01,1.3406208038330079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,4,power_law_1.01,1.4817279815673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,32,power_law_1.01,0.5556223869323731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,4,power_law_1.01,1.6138240814208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,32,power_law_1.01,0.5529407978057861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,4,power_law_1.01,1.7905664443969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,32,power_law_1.01,0.5519360065460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,32,power_law_1.01,0.5461887836456298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,4,power_law_1.01,2.0545536041259767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,32,power_law_1.01,0.5539840221405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,32,power_law_1.01,0.49684481620788573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,4,power_law_1.01,2.6238975524902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,32,power_law_1.01,0.49295358657836913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,32,power_law_1.01,0.5203968048095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,4,power_law_1.01,2.9992767333984376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,32,power_law_1.01,0.5277696132659913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,32,power_law_1.01,0.5191679954528808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,32,power_law_1.01,0.5435391902923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,32,power_law_1.01,0.520192003250122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,4,power_law_1.01,4.0871936798095705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,32,power_law_1.01,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,32,power_law_1.01,0.5697535991668701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,32,power_law_1.01,0.5634047985076904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,32,power_law_1.01,0.5660672187805176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,32,power_law_1.01,0.5648320198059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,4,power_law_1.01,5.3377025604248045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,32,power_law_1.01,0.6309887886047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,32,power_law_1.01,0.6737919807434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,32,power_law_1.01,0.7718912124633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,32,power_law_1.01,0.8927231788635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,32,power_law_1.01,1.204428768157959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,32,power_law_1.01,1.157529640197754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,32,power_law_1.01,1.7321983337402345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,32,power_law_1.01,2.057625579833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,64,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,64,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,64,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,64,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,64,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,32,power_law_1.01,2.9077503204345705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,64,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,64,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,64,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,64,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,64,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,64,power_law_1.2,0.026393601298332216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,64,power_law_1.2,0.026393601298332216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,32,power_law_1.01,4.158464050292968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,64,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,2,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,2,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,64,power_law_1.2,0.03294079899787903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,2,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,2,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,2,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,2,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,64,power_law_1.2,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,2,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,2,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,2,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,64,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,2,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,2,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,2,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,64,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,2,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,2,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,2,balanced,0.08157866696516673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,2,balanced,0.09113599856694539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,64,power_law_1.2,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,2,balanced,0.11895466844240825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,2,balanced,0.18210132916768393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,2,balanced,0.1967786749204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,2,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,64,power_law_1.2,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,2,balanced,0.3290453354517619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,64,power_law_1.2,0.12943359613418579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,2,balanced,0.4599466721216838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,2,balanced,0.617301344871521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,64,power_law_1.2,0.1789952039718628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,2,balanced,0.973311980565389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,2,balanced,1.3494613965352376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,2,balanced,2.136890729268392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,2,power_law_1.01,0.316211199760437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,64,power_law_1.2,0.3289088010787964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,2,balanced,2.920106569925944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,2,power_law_1.01,0.547430419921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,2,power_law_1.01,1.0479616165161132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,2,power_law_1.01,1.319321632385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,64,power_law_1.2,0.41205759048461915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,2,power_law_1.01,2.188697624206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,2,power_law_1.01,2.859417533874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,2,power_law_1.01,3.4816001892089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,2,power_law_1.01,4.483481597900391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,2,power_law_1.01,4.1885631561279295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,2,power_law_1.01,4.695244979858399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,2,power_law_1.01,4.792319869995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,2,power_law_1.01,4.805427169799804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,2,power_law_1.01,4.739072036743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,64,power_law_1.2,0.6078464031219483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,2,power_law_1.01,5.136383819580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,2,power_law_1.01,4.827135848999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,2,power_law_1.01,5.158911895751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,2,power_law_1.01,5.4505470275878904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,2,power_law_1.01,5.7837566375732425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,2,power_law_1.01,5.898035049438477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,2,power_law_1.01,6.513254547119141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,2,power_law_1.01,6.971186828613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,2,power_law_1.01,7.688396453857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,2,power_law_1.01,8.10598373413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,2,power_law_1.01,9.848422241210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,2,power_law_1.01,11.445247650146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,2,power_law_1.01,15.09171142578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,64,power_law_1.2,0.940236759185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,2,power_law_1.01,17.248870849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,128,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,128,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,128,balanced,0.04862933357556661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,128,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,128,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,128,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,128,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,128,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,128,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,128,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,128,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,128,balanced,0.05748266478379568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,128,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,128,balanced,0.05851200222969055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,128,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,128,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,128,balanced,0.06946133573849995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,128,balanced,0.0936959981918335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,128,balanced,0.11281067132949829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,128,balanced,0.1699840029080709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,128,balanced,0.2152106761932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,128,balanced,0.2867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,128,balanced,0.3245866696039836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,128,balanced,0.38997332255045575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,128,balanced,0.43143999576568604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,128,balanced,0.607744018236796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,128,balanced,0.7833600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,2,power_law_1.2,0.24227840900421144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,2,power_law_1.2,0.33013119697570803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,2,power_law_1.2,0.47616000175476075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,2,power_law_1.2,0.6721536159515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,2,power_law_1.2,0.9650176048278809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,2,power_law_1.2,1.4800895690917968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,2,power_law_1.2,1.5245311737060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,2,power_law_1.2,1.6109567642211915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,2,power_law_1.2,1.6549888610839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,2,power_law_1.2,1.679769515991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,2,power_law_1.2,1.6846847534179688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,2,power_law_1.2,1.6891904830932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,2,power_law_1.2,1.7362943649291993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,2,power_law_1.2,1.760256004333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,2,power_law_1.2,1.8378751754760743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,2,power_law_1.2,1.8546688079833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,2,power_law_1.2,1.8894847869873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,2,power_law_1.2,1.9736576080322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,2,power_law_1.2,2.1037055969238283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,2,power_law_1.2,2.369945526123047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,2,power_law_1.2,2.6626047134399413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,2,power_law_1.2,3.285395050048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,2,power_law_1.2,4.112384033203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,2,power_law_1.2,5.16503677368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,2,power_law_1.2,6.288793563842773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,1,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,1,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,1,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,1,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,1,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,1,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,1,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,1,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,1,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,1,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,1,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,1,power_law_1.2,0.04360319972038269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,1,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,1,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,1,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,1,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,1,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,1,power_law_1.2,0.09400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,1,power_law_1.2,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,1,power_law_1.2,0.21176319122314452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,2,power_law_1.2,8.455372619628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,1,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,8,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,8,power_law_1.01,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,8,power_law_1.01,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,8,power_law_1.01,0.4853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,8,power_law_1.01,0.5957632064819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,8,power_law_1.01,0.6246399879455566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,8,power_law_1.01,0.5965695858001709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,8,power_law_1.01,0.6293504238128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,8,power_law_1.01,0.5648384094238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,8,power_law_1.01,0.6135807991027832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,1,balanced,0.18653333187103271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,1,balanced,0.36403199036916095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,1,balanced,0.7113386789957682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,8,power_law_1.01,0.5924863815307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,1,balanced,1.404586633046468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,8,power_law_1.01,0.6133759975433349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,1,balanced,2.73527463277181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,8,power_law_1.01,0.648806381225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,8,power_law_1.01,0.627507209777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,1,balanced,3.7032960255940757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,8,power_law_1.01,0.6834176063537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,8,power_law_1.01,0.6780928134918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,1,balanced,3.7133652369181314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,8,power_law_1.01,0.6854656219482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,8,power_law_1.01,0.7217152118682861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,1,balanced,3.743743896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,8,power_law_1.01,0.7102464199066162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,1,balanced,3.752959887186686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,8,power_law_1.01,0.7931903839111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,8,power_law_1.01,0.8499199867248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,1,balanced,3.764906565348307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,1,power_law_1.2,0.3907583951950073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,8,power_law_1.01,0.942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,1,balanced,3.7604640324910483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,8,power_law_1.01,1.2072959899902345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,1,balanced,3.7787307103474936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,8,power_law_1.01,1.5327232360839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,1,balanced,3.7949441274007163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,8,power_law_1.01,2.00130558013916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,1,balanced,3.8246399561564126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,8,power_law_1.01,2.726911926269531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,1,balanced,3.853311856587728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,1,balanced,3.878570556640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,8,power_law_1.01,3.237887954711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,1,balanced,3.930453300476074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,1,balanced,4.089173316955566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,1,balanced,4.08678404490153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,1,balanced,4.186794598897298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,1,balanced,4.333733240763347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,1,balanced,4.5745493570963545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,1,balanced,4.9001814524332685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,1,balanced,5.556565602620442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,1,power_law_1.2,0.5236735820770264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,1,balanced,6.303232192993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,1,balanced,8.542207717895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,1,balanced,10.071039835611979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,1,power_law_1.2,0.830668830871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,1,power_law_1.2,1.1239423751831055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,2,power_law_1.2,11.205836486816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,1,power_law_1.2,0.032953599095344545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,1,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,1,power_law_1.2,0.06570240259170532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,1,power_law_1.2,0.24780800342559814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,1,power_law_1.2,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,1,power_law_1.2,0.2486016035079956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,1,power_law_1.2,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,1,power_law_1.2,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,1,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,1,power_law_1.2,0.26562559604644775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,1,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,1,power_law_1.2,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,1,power_law_1.2,0.2758656024932861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,1,power_law_1.2,0.2762752056121826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,1,power_law_1.2,0.28446719646453855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,1,power_law_1.2,0.29675519466400146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,1,power_law_1.2,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,1,power_law_1.2,0.37457919120788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,1,power_law_1.2,0.4216832160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,4,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,4,balanced,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,4,balanced,0.43622398376464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,4,balanced,0.8212426503499349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,4,balanced,1.4912853240966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,4,balanced,2.089471975962321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,4,balanced,2.0980052947998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,4,balanced,2.11027193069458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,4,balanced,2.1164372762044272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,4,balanced,2.1261653900146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,4,balanced,2.134010632832845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,4,balanced,2.1522773106892905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,4,balanced,2.1650773684183755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,4,balanced,2.1915146509806314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,1,power_law_1.2,0.5158912181854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,4,balanced,2.2147413889567056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,4,balanced,2.24017063776652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,4,balanced,2.2855680783589682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,4,balanced,2.330453395843506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,4,balanced,2.4106666247049966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,4,balanced,2.5837225914001465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,4,balanced,2.7622400919596353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,4,balanced,3.110912005106608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,4,balanced,3.477504094441732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,4,balanced,4.3202559153238935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,1,power_law_1.2,0.677888011932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,1,power_law_1.2,1.8165760040283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,4,balanced,5.25875186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,4,balanced,7.241029103597005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,4,balanced,9.172821044921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,1,power_law_1.2,0.9551872253417969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,1,power_law_1.2,1.2959744453430175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,1,power_law_1.2,2.4979455947875975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,2,power_law_1.2,0.19967999458312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,2,power_law_1.2,0.35778560638427737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,2,power_law_1.2,0.4847616195678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,2,power_law_1.2,0.7675903797149658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,2,power_law_1.2,1.042636775970459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,2,power_law_1.2,1.4524415969848632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,2,power_law_1.2,1.9777536392211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,1,power_law_1.2,1.9363840103149415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,2,power_law_1.2,2.1757951736450196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,2,power_law_1.2,2.1389312744140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,2,power_law_1.2,2.1934080123901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,2,power_law_1.2,2.097760009765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,2,power_law_1.2,2.2806528091430662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,2,power_law_1.2,2.2624256134033205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,2,power_law_1.2,2.4465408325195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,2,power_law_1.2,2.411315155029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,2,power_law_1.2,2.430156707763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,2,power_law_1.2,2.4989696502685548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,2,power_law_1.2,2.7013120651245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,2,power_law_1.2,2.7746303558349608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,2,power_law_1.2,2.7994047164916993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,2,power_law_1.2,3.1457279205322264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,2,power_law_1.2,3.584409713745117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,1,power_law_1.2,2.693734359741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,2,power_law_1.2,4.099891281127929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,2,power_law_1.2,5.054668807983399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,2,power_law_1.2,6.280192184448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,2,power_law_1.2,7.912038421630859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,2,power_law_1.2,9.483468627929687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,8,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,8,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,8,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,8,power_law_1.2,0.04872319996356964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,8,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,8,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,8,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,8,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,8,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,8,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,8,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,8,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,8,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,8,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,8,power_law_1.2,0.06654719710350036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,8,power_law_1.2,0.07287039756774902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,8,power_law_1.2,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,8,power_law_1.2,0.14049279689788818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,8,power_law_1.2,0.20008959770202636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,8,power_law_1.2,0.26910719871520994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,8,power_law_1.2,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,8,power_law_1.2,0.4937727928161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,8,power_law_1.2,0.6334464073181152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,8,power_law_1.2,1.2759039878845215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,8,power_law_1.2,1.5830656051635743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,1,power_law_1.2,4.117504119873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,8,power_law_1.2,2.613862419128418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,8,power_law_1.2,3.7126144409179687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,1,power_law_1.2,5.467750549316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,64,power_law_1.2,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,64,power_law_1.2,0.29081599712371825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,64,power_law_1.2,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,64,power_law_1.2,0.28446719646453855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,64,power_law_1.2,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,64,power_law_1.2,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,64,power_law_1.2,0.26255359649658205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,64,power_law_1.2,0.26746881008148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,64,power_law_1.2,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,64,power_law_1.2,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,64,power_law_1.2,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,64,power_law_1.2,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,64,power_law_1.2,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,64,power_law_1.2,0.30351359844207765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,64,power_law_1.2,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,256,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,64,power_law_1.2,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,256,power_law_1.2,0.07535359859466553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,64,power_law_1.2,0.32378880977630614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,256,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,64,power_law_1.2,0.364134407043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,256,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,64,power_law_1.2,0.37416958808898926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,256,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,64,power_law_1.2,0.44359679222106935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,256,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,64,power_law_1.2,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,256,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,64,power_law_1.2,0.685260820388794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,256,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,256,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,256,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,64,power_law_1.2,0.9834495544433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,256,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,8,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,256,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,8,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,256,power_law_1.2,0.0698303997516632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,8,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,64,power_law_1.2,1.4321663856506348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,256,power_law_1.2,0.0899071991443634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,256,power_law_1.2,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,8,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,8,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,256,power_law_1.2,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,8,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,64,power_law_1.2,1.9955711364746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,8,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,256,power_law_1.2,0.15749119520187377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,256,power_law_1.2,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,8,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,8,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,256,power_law_1.2,0.27729918956756594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,8,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,8,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,256,power_law_1.2,0.45424637794494627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,8,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,64,power_law_1.2,2.855936050415039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,8,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,256,power_law_1.2,0.46305279731750487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,8,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,8,power_law_1.2,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,8,power_law_1.2,0.08640639781951905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,256,power_law_1.2,0.7467008113861084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,8,power_law_1.2,0.1669119954109192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,8,power_law_1.2,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,256,power_law_1.2,0.8581119537353515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,8,power_law_1.2,0.37765119075775144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,8,power_law_1.2,0.5537792205810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,256,power_law_1.2,1.5056896209716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,256,power_law_1.2,1.7764352798461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,256,power_law_1.2,3.6792320251464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,8,power_law_1.2,0.8652799606323243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,256,power_law_1.2,4.258201599121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,8,power_law_1.2,1.1997183799743651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,64,power_law_1.2,4.220723342895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,1,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,1,balanced,0.027280000348885853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,1,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,1,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,1,balanced,0.2445653279622396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,1,balanced,0.24627200762430826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,1,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,1,balanced,0.2501973311106364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,1,balanced,0.252074658870697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,1,balanced,0.25463465849558514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,1,balanced,0.2515626748402913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,1,balanced,0.2573653260866801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,1,balanced,0.2611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,1,balanced,0.2706773281097412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,1,balanced,0.2778453429539998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,1,balanced,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,1,balanced,0.31249066193898517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,1,balanced,0.3461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,1,balanced,0.3677866856257121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,1,balanced,0.43485867977142334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,1,balanced,0.5154133240381876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,1,balanced,0.7393279870351156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,1,balanced,1.008128007253011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,1,balanced,1.4834346771240234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,1,balanced,1.9107839266459148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,1,balanced,2.7770560582478843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,1,balanced,3.677525202433268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,16,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,16,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,16,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,8,power_law_1.2,1.823129653930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,16,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,16,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,16,balanced,0.2800319989522298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,16,balanced,0.41335467497507733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,16,balanced,0.4159146547317505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,16,balanced,0.4174506664276123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,16,balanced,0.41779200236002606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,16,balanced,0.42018131415049237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,16,balanced,0.4247893492380778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,16,balanced,0.4261546532313029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,16,balanced,0.43059198061625165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,16,balanced,0.4394666751225789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,16,balanced,0.44202665487925213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,16,balanced,0.4536319971084595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,16,balanced,0.47274665037790936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,16,balanced,0.49612800280253094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,16,balanced,0.5319679975509644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,16,balanced,0.5666133165359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,16,balanced,0.6355626583099365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,16,balanced,0.7526400089263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,16,balanced,1.0106879870096843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,16,balanced,1.2245333194732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,16,balanced,1.6411306063334148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,16,balanced,2.090496063232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,2,power_law_1.01,0.237772798538208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,2,power_law_1.01,0.3999743938446045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,2,power_law_1.01,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,2,power_law_1.01,0.7456768035888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,2,power_law_1.01,1.0266624450683595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,2,power_law_1.01,1.641868782043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,2,power_law_1.01,1.6650239944458007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,2,power_law_1.01,1.7459199905395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,2,power_law_1.01,1.8329599380493165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,2,power_law_1.01,1.8946048736572265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,2,power_law_1.01,1.8536447525024413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,2,power_law_1.01,2.000486373901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,2,power_law_1.01,2.023628807067871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,2,power_law_1.01,2.0731903076171876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,2,power_law_1.01,2.088960075378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,2,power_law_1.01,2.190131187438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,2,power_law_1.01,2.3044095993041993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,2,power_law_1.01,2.4655872344970704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,2,power_law_1.01,2.653798484802246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,8,power_law_1.2,2.6595327377319338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,2,power_law_1.01,3.0099456787109373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,2,power_law_1.01,3.465216064453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,2,power_law_1.01,4.33172492980957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,2,power_law_1.01,4.937318420410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,2,power_law_1.01,6.886399841308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,2,power_law_1.01,8.435494232177735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,2,power_law_1.01,11.73012466430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,2,power_law_1.01,15.112396240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,32,power_law_1.01,0.3231744050979614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,32,power_law_1.01,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,32,power_law_1.01,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,32,power_law_1.01,0.2910207986831665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,32,power_law_1.01,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,32,power_law_1.01,0.2396159887313843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,32,power_law_1.01,0.26746881008148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,32,power_law_1.01,0.26910719871520994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,32,power_law_1.01,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,32,power_law_1.01,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,32,power_law_1.01,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,32,power_law_1.01,0.29409279823303225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,32,power_law_1.01,0.28979198932647704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,32,power_law_1.01,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,32,power_law_1.01,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,32,power_law_1.01,0.33136639595031736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,32,power_law_1.01,0.32727038860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,32,power_law_1.01,0.36450560092926027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,32,power_law_1.01,0.3870719909667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,32,power_law_1.01,0.45465598106384275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,32,power_law_1.01,0.4908927917480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,32,power_law_1.01,0.6006783962249755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,32,power_law_1.01,0.8011712074279785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,32,power_law_1.01,1.217740821838379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,32,power_law_1.01,1.6113664627075195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,32,power_law_1.01,2.269593620300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,32,power_law_1.01,3.27720947265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,128,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,128,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,128,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,128,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,128,balanced,0.02696000039577484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,128,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,128,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,128,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,128,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,128,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,128,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,128,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,128,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,128,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,128,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,128,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,128,balanced,0.03155199935038885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,128,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,128,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,128,balanced,0.03513066718975703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,128,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,128,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,128,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,128,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,128,balanced,0.0744053324063619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,128,balanced,0.15240533153216043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,128,balanced,0.22579199075698853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,8,power_law_1.2,0.1691648006439209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,8,power_law_1.2,0.2689023971557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,8,power_law_1.2,0.3452928066253662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,8,power_law_1.2,0.33914239406585694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,8,power_law_1.2,0.29859840869903564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,8,power_law_1.2,0.39772160053253175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,8,power_law_1.2,0.40960001945495605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,8,power_law_1.2,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,8,power_law_1.2,0.43335680961608886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,8,power_law_1.2,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,8,power_law_1.2,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,8,power_law_1.2,0.4769792079925537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,8,power_law_1.2,0.4577280044555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,8,power_law_1.2,0.48865280151367185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,8,power_law_1.2,0.4982719898223877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,8,power_law_1.2,0.49356799125671386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,8,power_law_1.2,0.5058559894561767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,1,power_law_1.01,1.0571776390075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,8,power_law_1.2,0.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,8,power_law_1.2,0.5857279777526856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,1,power_law_1.01,2.045952033996582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,8,power_law_1.2,0.738099193572998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,8,power_law_1.2,0.7938047885894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,8,power_law_1.2,1.0270719528198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,1,power_law_1.01,4.125696182250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,8,power_law_1.2,1.1513855934143067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,1,power_law_1.01,8.190361785888673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,8,power_law_1.2,1.599078369140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,8,power_law_1.2,1.7102848052978517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,1,power_law_1.01,12.046336364746093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,1,power_law_1.01,16.376626586914064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,8,power_law_1.2,2.4971263885498045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,1,power_law_1.01,22.40921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,1,power_law_1.01,23.474790954589842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,2,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,2,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,2,balanced,0.029002666473388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,2,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,2,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,2,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,2,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,2,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,2,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,2,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,2,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,2,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,2,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,2,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,2,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,2,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,2,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,2,balanced,0.08755200107892354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,2,balanced,0.09540266791979472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,2,balanced,0.1646933356920878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,2,balanced,0.2121386726697286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,8,power_law_1.2,3.3198078155517576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,2,balanced,0.3227306604385376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,2,balanced,0.4322986602783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,2,balanced,0.636245330174764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,2,balanced,0.86135466893514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,2,balanced,1.3769386609395344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,1,power_law_1.01,24.531968688964845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,2,balanced,1.9157333374023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,1,power_law_1.01,25.00095977783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,1,power_law_1.01,26.384384155273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,1,power_law_1.01,26.655947875976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,1,power_law_1.01,27.271783447265626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,1,power_law_1.01,28.51143798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,1,power_law_1.01,29.54649658203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,1,power_law_1.01,30.334567260742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,1,power_law_1.01,30.486734008789064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,1,power_law_1.01,33.27057800292969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,2,power_law_1.01,0.6162432193756103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,2,power_law_1.01,0.9752575874328613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,2,power_law_1.01,1.410041618347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,2,power_law_1.01,2.174566459655762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,2,power_law_1.01,2.6761215209960936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,1,power_law_1.01,34.47193603515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,2,power_law_1.01,4.137369537353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,2,power_law_1.01,4.4777473449707035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,2,power_law_1.01,4.635033416748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,2,power_law_1.01,4.755865478515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,2,power_law_1.01,4.807270431518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,2,power_law_1.01,4.991385650634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,1,power_law_1.01,36.89738159179687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,2,power_law_1.01,5.053440093994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,2,power_law_1.01,5.151948928833008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,2,power_law_1.01,5.455257415771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,2,power_law_1.01,5.531852722167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,2,power_law_1.01,5.590630340576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,2,power_law_1.01,5.642444610595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,2,power_law_1.01,6.143180847167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,1,power_law_1.01,38.88414611816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,2,power_law_1.01,6.2283775329589846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,2,power_law_1.01,6.850764465332031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,2,power_law_1.01,7.016652679443359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,2,power_law_1.01,8.855757141113282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,1,power_law_1.01,41.421209716796874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,2,power_law_1.01,9.009561920166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,2,power_law_1.01,11.70862045288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,2,power_law_1.01,14.341734313964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,16,power_law_1.2,0.315391993522644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,16,power_law_1.2,0.5345280170440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,16,power_law_1.2,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,16,power_law_1.2,0.5240767955780029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,1,power_law_1.01,49.99638977050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,16,power_law_1.2,0.5492735862731933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,2,power_law_1.01,20.252056884765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,16,power_law_1.2,0.42885122299194334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,16,power_law_1.2,0.48127360343933107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,16,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,16,power_law_1.2,0.4724736213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,16,power_law_1.01,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,16,power_law_1.2,0.47411198616027833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,16,power_law_1.01,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,16,power_law_1.01,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,16,power_law_1.2,0.4956160068511963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,16,power_law_1.2,0.4753407955169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,16,power_law_1.01,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,16,power_law_1.2,0.5232639789581299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,16,power_law_1.01,0.20169599056243898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,16,power_law_1.01,0.2289664030075073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,16,power_law_1.2,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,16,power_law_1.01,0.28037118911743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,16,power_law_1.2,0.5292031764984131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,16,power_law_1.01,0.2519040107727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,16,power_law_1.2,0.5465919971466064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,16,power_law_1.01,0.24657919406890869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,16,power_law_1.2,0.5302271842956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,16,power_law_1.01,0.27402238845825194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,16,power_law_1.2,0.5810175895690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,16,power_law_1.01,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,16,power_law_1.01,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,16,power_law_1.2,0.6303743839263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,16,power_law_1.01,0.26972160339355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,16,power_law_1.2,0.689356803894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,16,power_law_1.01,0.3033087968826294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,16,power_law_1.01,0.2920448064804077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,16,power_law_1.2,0.7845888137817383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,2,power_law_1.01,23.964877319335937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,16,power_law_1.01,0.29160959720611573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,16,power_law_1.2,0.8372223854064942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,16,power_law_1.01,0.33873920440673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,16,power_law_1.01,0.35348479747772216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,16,power_law_1.2,1.015193557739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,16,power_law_1.01,0.39872639179229735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,16,power_law_1.01,0.45465598106384275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,16,power_law_1.2,1.3770751953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,256,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,256,power_law_1.01,0.058329600095748904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,16,power_law_1.01,0.6238207817077637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,256,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,16,power_law_1.2,1.8939903259277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,16,power_law_1.01,0.7921664237976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,256,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,256,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,16,power_law_1.01,1.131929588317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,256,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,16,power_law_1.2,2.509209632873535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,256,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,256,power_law_1.01,0.06263039708137512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,16,power_law_1.01,1.600102424621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,256,power_law_1.01,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,256,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,16,power_law_1.2,3.331276702880859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,256,power_law_1.01,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,16,power_law_1.01,2.211635208129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,256,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,256,power_law_1.01,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,256,power_law_1.01,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,256,power_law_1.01,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,256,power_law_1.01,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,16,power_law_1.2,4.254924774169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,16,power_law_1.01,2.982912063598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,256,power_law_1.01,0.11448320150375366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,256,power_law_1.01,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,1,power_law_1.01,58.8521484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,256,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,256,power_law_1.01,0.3645440101623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,256,power_law_1.01,0.49848318099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,256,power_law_1.01,0.7202816009521484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,256,power_law_1.01,0.881049633026123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,256,power_law_1.01,1.4104576110839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,256,power_law_1.01,1.985331153869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,256,power_law_1.01,3.030220794677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,256,power_law_1.01,4.403596878051758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,1,power_law_1.01,66.37833251953126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,1,power_law_1.01,87.62777709960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,1,power_law_1.01,87.9941650390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,32,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,32,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,32,power_law_1.2,0.027423998713493346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,32,power_law_1.2,0.025183999538421632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,32,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,32,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,32,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,32,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,32,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,32,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,32,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,32,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,32,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,32,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,32,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,32,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,32,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,32,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,32,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,32,power_law_1.2,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,32,power_law_1.2,0.10035200119018554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,32,power_law_1.2,0.12554240226745605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,32,power_law_1.2,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,32,power_law_1.2,0.4050943851470947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,32,power_law_1.2,0.4167679786682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,32,power_law_1.2,0.7385087966918945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,1,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,1,power_law_1.2,0.3082240104675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,1,power_law_1.2,0.5683199882507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,1,power_law_1.2,0.8335359573364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,1,power_law_1.2,1.1401087760925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,1,power_law_1.2,2.0934656143188475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,1,power_law_1.2,2.29355525970459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,1,power_law_1.2,2.36810245513916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,1,power_law_1.2,2.4793088912963865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,1,power_law_1.2,2.494259262084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,1,power_law_1.2,2.616524887084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,1,power_law_1.2,2.657894325256348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,1,power_law_1.2,2.678144073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,1,power_law_1.2,2.7727872848510744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,1,power_law_1.2,2.8284927368164063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,32,power_law_1.2,1.0915840148925782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,1,power_law_1.2,2.8844032287597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,1,power_law_1.2,2.981068801879883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,1,power_law_1.2,3.1662080764770506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,1,power_law_1.2,3.3812480926513673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,1,power_law_1.2,3.7740543365478514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,1,power_law_1.2,4.202867126464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,1,power_law_1.2,5.0460670471191404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,1,power_law_1.2,5.719244766235351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,1,power_law_1.2,7.4829566955566404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,1,power_law_1.2,8.997478485107422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,1,power_law_1.2,12.448973083496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.02863999903202057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.04809600114822388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.09728000164031983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.10424319505691529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.13312000036239624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.19824639558792115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,1,power_law_1.2,16.1691650390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.36618239879608155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.7921664237976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,1,power_law_1.01,1.234943962097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,1,power_law_1.01,1.6748544692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,32,power_law_1.01,0.4181951999664307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,32,power_law_1.01,0.3780607938766479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,32,power_law_1.01,0.3792896032333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,32,power_law_1.01,0.3248127937316895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,32,power_law_1.01,0.260915207862854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,32,power_law_1.01,0.3411967992782593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,32,power_law_1.01,0.37128961086273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,32,power_law_1.01,0.3852288007736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,4,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,32,power_law_1.01,0.3876800060272217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,4,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,32,power_law_1.01,0.39096319675445557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,4,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,32,power_law_1.01,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,4,power_law_1.01,0.03971840143203735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,32,power_law_1.01,0.3985408067703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,4,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,4,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,32,power_law_1.01,0.40181760787963866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,4,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,32,power_law_1.01,0.3895296096801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,4,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,32,power_law_1.01,0.42270717620849607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,4,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,4,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,32,power_law_1.01,0.4014080047607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,4,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,32,power_law_1.01,0.43581438064575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,4,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,4,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,32,power_law_1.01,0.46919679641723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,4,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,32,power_law_1.01,0.4855807781219482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,4,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,4,power_law_1.01,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,32,power_law_1.01,0.6193151950836182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,4,power_law_1.01,0.1112064003944397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,4,power_law_1.01,0.1716223955154419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,32,power_law_1.01,0.7868415832519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,4,power_law_1.01,0.20377600193023682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,4,power_law_1.01,0.2717695951461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,32,power_law_1.01,1.1192319869995118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,4,power_law_1.01,0.34508800506591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,4,power_law_1.01,0.5165056228637696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,32,power_law_1.01,1.1321344375610352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,4,power_law_1.01,0.7114751815795899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,32,power_law_1.01,1.7108991622924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,4,power_law_1.01,1.1538432121276856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,4,power_law_1.01,1.5005696296691895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,32,power_law_1.01,2.2538240432739256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,4,power_law_1.01,2.6613759994506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,32,power_law_1.01,3.116441535949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,4,power_law_1.01,2.994790458679199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,32,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,32,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,32,power_law_1.01,4.877721786499023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,32,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,32,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,32,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,32,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,32,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,32,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,32,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,32,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,32,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,32,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,32,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,32,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,32,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,32,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,32,power_law_1.01,0.08110079765319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,32,power_law_1.01,0.10341119766235352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,32,power_law_1.01,0.16936960220336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,32,power_law_1.01,0.255180811882019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,32,power_law_1.01,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,32,power_law_1.01,0.4065279960632324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,32,power_law_1.01,0.5273407936096192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,32,power_law_1.01,0.7813119888305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,1,power_law_1.01,2.5489408493041994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,32,power_law_1.01,1.042636775970459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,32,power_law_1.01,1.6740352630615234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,32,power_law_1.01,2.278803253173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,1,power_law_1.01,3.3544063568115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.04442239999771118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.07515519857406616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.20622720718383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.22568960189819337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.24248321056365968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.2568192005157471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.28936960697174074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.30699520111083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.35614719390869143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.43274240493774413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.5380095958709716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.7987199783325195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,1,power_law_1.2,1.053286361694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,1,power_law_1.2,1.5247360229492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,1,power_law_1.2,2.0041664123535154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,1,power_law_1.2,3.033497619628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,1,power_law_1.2,4.0609790802001955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,1,power_law_1.2,6.212812805175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,1,power_law_1.2,8.345394897460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,32,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,32,balanced,0.2903040051460266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,32,balanced,0.5787306626637777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,32,balanced,0.5509119828542074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,32,balanced,0.5423786640167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,32,balanced,0.5457919836044312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,32,balanced,0.5468159914016724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,32,balanced,0.5485226710637411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,32,balanced,0.5522773265838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,32,balanced,0.5562026500701904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,32,balanced,0.5631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,32,balanced,0.5707093477249146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,32,balanced,0.5780479907989502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,32,balanced,0.5910186767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,32,balanced,0.6135466496149699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,32,balanced,0.6490453481674194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,32,balanced,0.7009279727935791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,32,balanced,0.7374506791432699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,32,balanced,0.807423988978068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,32,balanced,0.8900266488393148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,32,balanced,1.1118933359781902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,32,balanced,1.3870080312093098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,32,balanced,1.8781867027282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,32,balanced,2.394282658894857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.12165119647979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.25477120876312254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.36966400146484374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.510361623764038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.7530496120452881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.8022015571594239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.8433664321899415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.8495039939880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.9154560089111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.9480192184448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,1,power_law_1.2,1.0145792007446288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,1,power_law_1.2,1.0790911674499513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,1,power_law_1.2,1.1425791740417481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,1,power_law_1.2,1.1833344459533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,1,power_law_1.2,1.297612762451172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,1,power_law_1.2,1.5208448410034179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,1,power_law_1.2,1.7522687911987305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,1,power_law_1.2,2.153881645202637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,1,power_law_1.2,2.5673728942871095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,1,power_law_1.2,3.432223892211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,1,power_law_1.2,4.343193435668946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,1,power_law_1.2,6.212607955932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,1,power_law_1.2,8.020377349853515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,1,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,1,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,1,balanced,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,1,balanced,0.45960533618927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,1,balanced,0.8866133689880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,1,balanced,0.8939359982808431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,1,balanced,0.900597333908081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,1,balanced,0.9074347019195557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,1,balanced,0.9149333635965983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,1,balanced,0.9217706521352133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,1,balanced,0.9323519865671793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,1,balanced,0.9478826522827148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,1,balanced,0.9620479742685953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,1,balanced,0.9838933149973551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,1,balanced,1.0246826807657878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,1,power_law_1.2,11.734630584716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,1,balanced,1.0509653091430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,1,balanced,1.106602668762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,1,balanced,1.185109297434489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,1,balanced,1.3035519917805989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,1,balanced,1.5340959231058757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,1,balanced,1.7483092943827312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,1,balanced,2.2507519721984863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,8,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,1,balanced,2.7511466344197593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,8,power_law_1.2,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,8,power_law_1.2,0.2578239917755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,8,power_law_1.2,0.32911360263824463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,1,balanced,3.867136001586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,8,power_law_1.2,0.3645440101623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,1,power_law_1.2,15.500480651855469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,8,power_law_1.2,0.33280000686645506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,8,power_law_1.2,0.3655679941177368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,8,power_law_1.2,0.3575808048248291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,1,balanced,5.012821197509766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,8,power_law_1.2,0.37765119075775144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,8,power_law_1.2,0.35880959033966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,8,power_law_1.2,0.369049596786499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,8,power_law_1.2,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,8,power_law_1.2,0.38871040344238283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,8,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,8,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,8,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,1,balanced,7.280469258626302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,8,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,8,power_law_1.2,0.40611839294433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,8,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,8,balanced,0.03839466720819473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,8,balanced,0.03873066604137421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,8,power_law_1.2,0.4210559844970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,8,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,8,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,8,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,8,power_law_1.2,0.40857601165771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,8,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,8,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,8,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,8,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,8,power_law_1.2,0.43294720649719237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,8,balanced,0.07099733253320058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,8,balanced,0.09198932846387227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,8,balanced,0.16725333531697592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,8,power_law_1.2,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,8,balanced,0.19592533508936563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,8,balanced,0.2539520064989726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,8,power_law_1.2,0.5152768135070801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,8,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,8,balanced,0.36266668637593585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,1,balanced,9.47438939412435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,8,power_law_1.2,0.5863423824310303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,8,balanced,0.438101331392924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,8,balanced,0.6652586857477824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,8,power_law_1.2,0.6676479816436768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,8,balanced,0.8845653533935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,8,power_law_1.2,0.9582464218139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,8,power_law_1.2,1.2500991821289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,8,power_law_1.2,1.8331647872924806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,8,power_law_1.2,2.1215232849121093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,8,power_law_1.2,3.19815673828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,4,power_law_1.2,0.03991039991378784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,4,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,4,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,4,power_law_1.2,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,4,power_law_1.2,0.1861631989479065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,4,power_law_1.2,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,4,power_law_1.2,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,4,power_law_1.2,0.3184639930725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,4,power_law_1.2,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,4,power_law_1.2,0.30351359844207765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,4,power_law_1.2,0.2988032102584839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,4,power_law_1.2,0.3215359926223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,4,power_law_1.2,0.3351360082626343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,4,power_law_1.2,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,4,power_law_1.2,0.3590143918991089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,4,power_law_1.2,0.3536895990371704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,4,power_law_1.2,0.3778559923171997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,4,power_law_1.2,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,4,power_law_1.2,0.4118527889251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,4,power_law_1.2,0.4704256057739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,4,power_law_1.2,0.5025792121887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,4,power_law_1.2,0.6479872226715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,4,power_law_1.2,0.8888319969177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,4,power_law_1.2,1.1485183715820313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,4,power_law_1.2,1.6345087051391602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,4,power_law_1.2,2.2222848892211915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,4,power_law_1.2,2.6841087341308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,8,power_law_1.2,4.422451019287109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,32,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,32,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,32,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,32,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,32,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,32,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,32,power_law_1.01,0.034176000952720643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,32,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,32,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,32,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,32,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,32,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,32,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,32,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,32,power_law_1.01,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,32,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,32,power_law_1.01,0.09215360283851623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,32,power_law_1.01,0.11711360216140747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,32,power_law_1.01,0.1464319944381714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,32,power_law_1.01,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,32,power_law_1.01,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,32,power_law_1.01,0.3856384038925171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,32,power_law_1.01,0.48435201644897463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,32,power_law_1.01,0.7094272136688232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,32,power_law_1.01,1.1118592262268066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,32,power_law_1.01,1.762713623046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,32,power_law_1.01,2.2384639739990235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,2,power_law_1.01,1.1046784400939942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,2,power_law_1.01,2.0428672790527345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,2,power_law_1.01,3.1062015533447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,2,power_law_1.01,5.013708877563476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,2,power_law_1.01,6.352486419677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,2,power_law_1.01,8.3810302734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,2,power_law_1.01,12.252569580078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,2,power_law_1.01,12.101631927490235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,2,power_law_1.01,13.00869140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,2,power_law_1.01,13.27247314453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,2,power_law_1.01,13.449215698242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,2,power_law_1.01,13.435289001464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,2,power_law_1.01,14.162535095214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,2,power_law_1.01,14.142874145507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,2,power_law_1.01,14.559027099609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,2,power_law_1.01,15.769190979003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,2,power_law_1.01,16.359219360351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,2,power_law_1.01,18.158387756347658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,2,power_law_1.01,16.869171142578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,4,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,4,power_law_1.01,0.29531519412994384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,4,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,4,power_law_1.01,0.36823039054870604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,4,power_law_1.01,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,4,power_law_1.01,0.6531072139739991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,4,power_law_1.01,0.6692543983459472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,4,power_law_1.01,0.6531072139739991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,4,power_law_1.01,0.7034880161285401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,2,power_law_1.01,17.974272155761717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,4,power_law_1.01,0.6674431800842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,4,power_law_1.01,0.6969344139099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,4,power_law_1.01,0.7069695949554443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,4,power_law_1.01,0.7430143833160401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,4,power_law_1.01,0.7331711769104003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,4,power_law_1.01,0.7604224205017089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,4,power_law_1.01,0.7878655910491943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,4,power_law_1.01,0.8314559936523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,4,power_law_1.01,0.8669183731079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,4,power_law_1.01,0.8912768363952637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,4,power_law_1.01,1.081721591949463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,2,power_law_1.01,18.77442626953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,4,power_law_1.01,1.156710433959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,4,power_law_1.01,1.5773695945739745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,4,power_law_1.01,1.9771007537841796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,4,power_law_1.01,2.575359916687012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,4,power_law_1.01,3.104767990112305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,2,power_law_1.01,20.795802307128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,4,power_law_1.01,4.517068862915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,4,power_law_1.01,6.318694305419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,2,power_law_1.01,24.862106323242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,16,power_law_1.2,0.5982207775115966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,16,power_law_1.2,1.0561535835266114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,16,power_law_1.2,0.9119744300842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,16,power_law_1.2,1.0422271728515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,16,power_law_1.2,1.036473560333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,2,power_law_1.01,31.663104248046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,16,power_law_1.2,0.7641088008880615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,16,power_law_1.2,0.8660991668701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,16,power_law_1.2,0.9005056381225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,16,power_law_1.2,0.8759296417236329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,16,power_law_1.2,0.8685248374938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,16,power_law_1.2,0.9127936363220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,16,power_law_1.2,0.9809920310974121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,16,power_law_1.2,0.9984000205993653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,16,power_law_1.2,0.9988096237182618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,16,power_law_1.2,1.010483169555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,16,power_law_1.2,1.0469375610351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,16,power_law_1.2,1.100166416168213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,16,power_law_1.2,1.1036416053771974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,16,power_law_1.2,1.1610112190246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,2,power_law_1.01,30.305892944335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,16,power_law_1.2,1.401036834716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,16,power_law_1.2,1.561190414428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,16,power_law_1.2,2.0727680206298826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,16,power_law_1.2,2.3726079940795897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,16,power_law_1.2,3.782041549682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,16,power_law_1.2,3.932160186767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,16,power_law_1.2,5.38603515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,4,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,4,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,16,power_law_1.2,7.324877166748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,4,power_law_1.01,0.2996223926544189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,2,power_law_1.01,38.385049438476564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,4,power_law_1.01,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,4,power_law_1.01,0.40960001945495605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,4,power_law_1.01,0.532480001449585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,4,power_law_1.01,0.5257215976715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,4,power_law_1.01,0.6543360233306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,4,power_law_1.01,0.6070271968841553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,4,power_law_1.01,0.628326416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,4,power_law_1.01,0.6533120155334473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,4,power_law_1.01,0.6846464157104493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,4,power_law_1.01,0.6428671836853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,4,power_law_1.01,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,4,power_law_1.01,0.7223296165466309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,4,power_law_1.01,0.7514111995697021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,4,power_law_1.01,0.7733248233795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,4,power_law_1.01,0.8622079849243164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,4,power_law_1.01,0.9490431785583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,4,power_law_1.01,1.0332159996032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,4,power_law_1.01,1.1618304252624512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,4,power_law_1.01,1.478656005859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,4,power_law_1.01,1.788096046447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,2,power_law_1.01,46.888345336914064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,4,power_law_1.01,2.287820816040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,4,power_law_1.01,2.7860992431640623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,4,power_law_1.01,4.0177665710449215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,4,power_law_1.01,5.157478332519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,8,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,8,power_law_1.01,0.2922368049621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,8,power_law_1.01,0.5437439918518067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,8,power_law_1.01,0.4792319774627686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,8,power_law_1.01,0.5697535991668701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,8,power_law_1.01,0.7079936027526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,8,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,8,power_law_1.01,0.7010303974151612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,8,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,8,power_law_1.01,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,8,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,8,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,8,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,8,power_law_1.01,0.68853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,8,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,8,power_law_1.01,0.7428095817565918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,8,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,8,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,8,power_law_1.01,0.6500351905822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,8,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,8,power_law_1.2,0.0706496000289917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,8,power_law_1.01,0.6582272052764893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,8,power_law_1.2,0.07454720139503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,8,power_law_1.2,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,8,power_law_1.01,0.6639616012573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,8,power_law_1.2,0.07475200295448303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,8,power_law_1.2,0.12267520427703857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,8,power_law_1.01,0.7008255958557129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,8,power_law_1.2,0.1632256031036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,8,power_law_1.01,0.7378943920135498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,8,power_law_1.01,0.7657472133636475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,8,power_law_1.01,0.7589888095855712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,8,power_law_1.2,0.2066431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,8,power_law_1.01,0.8112128257751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,8,power_law_1.2,0.25231359004974363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,8,power_law_1.01,0.8859647750854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,8,power_law_1.01,0.9558015823364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,8,power_law_1.01,1.0526720046997071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,8,power_law_1.2,0.42699518203735354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,8,power_law_1.01,1.1988991737365722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,8,power_law_1.2,0.587775993347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,8,power_law_1.01,1.4782464027404785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,8,power_law_1.01,1.826406478881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,8,power_law_1.01,2.4303615570068358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,8,power_law_1.01,3.4947071075439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,8,power_law_1.01,4.332953643798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,8,power_law_1.2,0.9371647834777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,8,power_law_1.2,1.2103679656982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,8,power_law_1.2,2.1125120162963866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,2,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,2,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,2,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,2,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,2,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,8,power_law_1.2,2.6222591400146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,2,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,2,power_law_1.01,0.07822719812393189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,2,power_law_1.01,0.07924479842185975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,2,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,2,power_law_1.01,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,2,power_law_1.01,0.1087488055229187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,2,power_law_1.01,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,2,power_law_1.01,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,2,power_law_1.01,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,2,power_law_1.01,0.20213758945465088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,2,power_law_1.01,0.20541439056396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,2,power_law_1.01,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,2,power_law_1.01,0.27238399982452394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,2,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,2,power_law_1.01,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,2,power_law_1.01,0.4143104076385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,2,power_law_1.01,0.5677055835723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,2,power_law_1.01,0.7370751857757568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,2,power_law_1.01,1.225318431854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,2,power_law_1.01,1.6066560745239258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,2,power_law_1.01,2.4211456298828127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,2,power_law_1.01,3.141427230834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,32,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,32,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,32,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,32,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,32,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,32,balanced,0.05169600248336792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,32,balanced,0.052042668064435325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,32,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,32,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,32,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,32,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,32,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,32,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,32,balanced,0.06739200154940288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,32,balanced,0.07901866734027863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,32,balanced,0.07814399898052216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,32,balanced,0.09745066364606221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,32,balanced,0.1088853379090627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,32,balanced,0.19933867454528809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,32,balanced,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,32,balanced,0.34541865189870197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,32,balanced,0.494762659072876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,32,balanced,0.6958080132802328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,32,balanced,0.9739946524302164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,1,power_law_1.2,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,1,power_law_1.2,0.7833600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,1,power_law_1.2,1.1266048431396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,1,power_law_1.2,2.0097024917602537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,1,power_law_1.2,1.9695615768432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,1,power_law_1.2,2.0490240097045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,1,power_law_1.2,2.0131839752197265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,1,power_law_1.2,2.020556831359863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,1,power_law_1.2,2.1614591598510744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,1,power_law_1.2,2.209587287902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,1,power_law_1.2,2.1825536727905273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,1,power_law_1.2,2.446131134033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,1,power_law_1.2,2.4152063369750976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,1,power_law_1.2,2.5446399688720702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,1,power_law_1.2,2.686771202087402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,1,power_law_1.2,2.79101448059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,1,power_law_1.2,3.1494144439697265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,1,power_law_1.2,3.647488021850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,1,power_law_1.2,4.103987121582032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,1,power_law_1.2,5.1138561248779295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,1,power_law_1.2,5.844787216186523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,4,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,4,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,4,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,4,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,4,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,4,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,4,power_law_1.2,0.130457603931427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,4,power_law_1.2,0.09789440035820007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,4,power_law_1.2,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,4,power_law_1.2,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,4,power_law_1.2,0.10854400396347046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,4,power_law_1.2,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,4,power_law_1.2,0.11939840316772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,4,power_law_1.2,0.15851520299911498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,4,power_law_1.2,0.15155199766159058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,4,power_law_1.2,0.18718719482421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,4,power_law_1.2,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,4,power_law_1.2,0.23060479164123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,4,power_law_1.2,0.2727936029434204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,4,power_law_1.2,0.3135488033294678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,4,power_law_1.2,0.3704832077026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,4,power_law_1.2,0.4636672019958496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,1,power_law_1.2,7.878041839599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,4,power_law_1.2,0.608460807800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,4,power_law_1.2,0.9426943778991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,4,power_law_1.2,1.2412927627563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,4,power_law_1.2,2.0129791259765626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,4,power_law_1.2,2.781388854980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,32,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,32,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,32,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,32,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,32,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,32,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,32,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,32,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,32,balanced,0.052373334765434265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,32,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,32,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,32,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,32,balanced,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,32,balanced,0.06963199873765309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,32,balanced,0.07849066456158955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,32,balanced,0.14967466394106546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,32,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,32,balanced,0.318122665087382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,32,balanced,0.4322986602783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,32,balanced,0.6075733502705892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,32,balanced,0.8031573295593262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,32,balanced,1.1915946801503499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,32,balanced,1.57149871190389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,1,power_law_1.2,9.823641967773437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,1,balanced,0.6324906746546427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,1,balanced,1.1043840249379475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,1,balanced,2.1614933013916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,1,balanced,4.258303960164388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,1,balanced,8.45038922627767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,1,balanced,10.575018564860025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,1,balanced,10.619391759236654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,1,balanced,10.648064295450846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,1,power_law_1.2,13.523968505859376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,1,balanced,10.679978688557943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,1,balanced,10.707285563151041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,1,balanced,10.765141805013021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,32,power_law_1.01,0.03192960023880005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,32,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,32,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,32,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,32,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,1,balanced,10.823168436686197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,32,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,32,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,32,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,32,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,32,power_law_1.01,0.031737598776817325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,32,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,32,power_law_1.01,0.03521279990673065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,1,balanced,10.869247436523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,32,power_law_1.01,0.04340479969978332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,32,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,32,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,32,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,32,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,32,power_law_1.01,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,32,power_law_1.01,0.12799999713897706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,1,balanced,10.957141876220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,32,power_law_1.01,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,32,power_law_1.01,0.26214399337768557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,32,power_law_1.01,0.3942399978637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,32,power_law_1.01,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,1,balanced,11.044522603352865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,32,power_law_1.01,0.8988672256469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,32,power_law_1.01,1.053286361694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,1,balanced,11.123029073079428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,1,balanced,11.263317108154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,1,balanced,11.546794891357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,1,balanced,11.838976542154947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,1,power_law_1.2,18.10636749267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,1,balanced,13.317972819010416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,1,balanced,12.747093200683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,1,balanced,13.62124760945638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,1,balanced,14.431915283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,1,balanced,17.659210205078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,1,balanced,20.429312388102215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,1,balanced,30.671526590983074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,1,balanced,41.120768229166664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,1,power_law_1.2,26.714111328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,1,power_law_1.2,35.297689819335936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,8,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,8,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,8,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,8,balanced,0.5393066803614298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,8,balanced,1.0325226783752441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,8,balanced,1.5243946711222331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,8,balanced,1.527978738149007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,8,balanced,1.53275728225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,8,balanced,1.5356586774190266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,8,balanced,1.5426559448242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,64,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,8,balanced,1.5489706993103027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,64,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,64,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,64,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,64,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,64,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,8,balanced,1.555456002553304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,64,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,64,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,64,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,64,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,64,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,8,balanced,1.5668907165527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,64,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,64,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,64,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,64,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,64,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,8,balanced,1.5830933252970378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,64,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,64,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,64,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,64,balanced,0.06673066814740498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,8,balanced,1.593173344930013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,64,balanced,0.08002133170763652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,64,balanced,0.1032533347606659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,8,balanced,1.6139945983886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,64,balanced,0.13448533415794373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,64,balanced,0.2775040070215861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,8,balanced,1.6575147310892742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,64,balanced,0.3537919918696086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,8,balanced,1.6976213455200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,64,balanced,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,8,balanced,1.774079958597819
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,64,balanced,0.7191893259684244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,8,balanced,1.849514643351237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,8,balanced,2.0113066037495932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,8,balanced,2.1700266202290854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,8,balanced,2.520064036051432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,8,balanced,2.893312136332194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,8,balanced,3.722240130106608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,8,balanced,4.683093388875325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,16,power_law_1.01,0.4579328060150146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,16,power_law_1.01,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,16,power_law_1.01,0.4597760200500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,16,power_law_1.01,0.44646401405334474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,16,power_law_1.01,0.41553921699523927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,16,power_law_1.01,0.44748802185058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,16,power_law_1.01,0.45035519599914553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,16,power_law_1.01,0.4448256015777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,16,power_law_1.01,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,16,power_law_1.01,0.44707841873168946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,16,power_law_1.01,0.45998082160949705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,16,power_law_1.01,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,16,power_law_1.01,0.4626431941986084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,16,power_law_1.01,0.4966271877288818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,16,power_law_1.01,0.49049601554870603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,16,power_law_1.01,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,16,power_law_1.01,0.49889278411865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,16,power_law_1.01,0.5369855880737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,16,power_law_1.01,0.601087999343872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,16,power_law_1.01,0.7124991893768311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,16,power_law_1.01,0.8546303749084473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,16,power_law_1.01,1.2281855583190917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,16,power_law_1.01,1.3467647552490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,16,power_law_1.01,2.0451263427734374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,16,power_law_1.01,2.4041343688964845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,16,power_law_1.01,3.9421951293945314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,16,power_law_1.01,5.224652862548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,16,power_law_1.01,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,16,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,16,power_law_1.01,0.06244480013847351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,16,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,16,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,4,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,4,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,4,balanced,0.284986674785614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,16,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,4,balanced,0.5538133382797241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,4,balanced,1.0437973340352376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,16,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,16,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,4,balanced,2.0152319272359214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,16,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,4,balanced,2.0237654050191245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,16,power_law_1.01,0.06532480120658875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,4,balanced,2.0613120396931968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,16,power_law_1.01,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,16,power_law_1.01,0.07475200295448303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,4,balanced,2.0672853787740073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,16,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,4,balanced,2.072234630584717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,16,power_law_1.01,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,16,power_law_1.01,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,4,balanced,2.049194653828939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,16,power_law_1.01,0.0899071991443634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,16,power_law_1.01,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,4,balanced,2.0616532961527505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,16,power_law_1.01,0.1562559962272644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,4,balanced,2.071381409962972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,16,power_law_1.01,0.1773568034172058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,4,balanced,2.090837319691976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,4,balanced,2.1090985933939614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,4,balanced,2.1234347025553384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,4,balanced,2.156533400217692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,16,power_law_1.01,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,4,balanced,2.219834645589193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,16,power_law_1.01,0.27934720516204836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,16,power_law_1.01,0.36739840507507326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,4,balanced,2.2823146184285483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,16,power_law_1.01,0.5519167900085449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,4,balanced,2.395136038462321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,16,power_law_1.01,0.912384033203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,4,balanced,2.5352320671081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,16,power_law_1.01,1.2087295532226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,4,balanced,2.776063919067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,16,power_law_1.01,2.022604751586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,4,balanced,3.0064640045166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,4,balanced,3.4737494786580405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,16,power_law_1.01,2.768889617919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,4,balanced,4.064768155415853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,4,balanced,5.584042867024739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,4,balanced,6.935381571451823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,8,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,8,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,8,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,8,power_law_1.01,0.09605119824409485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,8,power_law_1.01,0.09564160108566284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,8,power_law_1.01,0.13455359935760497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,8,power_law_1.01,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,8,power_law_1.01,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,8,power_law_1.01,0.17244160175323486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,8,power_law_1.01,0.13455359935760497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,8,power_law_1.01,0.1931264042854309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,8,power_law_1.01,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,8,power_law_1.01,0.21155838966369628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,8,power_law_1.01,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,8,power_law_1.01,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,8,power_law_1.01,0.22855679988861083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,8,power_law_1.01,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,8,power_law_1.01,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,8,power_law_1.01,0.3092479944229126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,8,power_law_1.01,0.3803136110305786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,8,power_law_1.01,0.4419583797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,8,power_law_1.01,0.601087999343872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,8,power_law_1.01,0.8714112281799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,8,power_law_1.01,1.2783616065979004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,8,power_law_1.01,1.600921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,8,power_law_1.01,2.533990478515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,8,power_law_1.01,3.4469886779785157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,32,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,32,balanced,0.05017066498597463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,32,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,32,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,32,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,32,balanced,0.3838293155034383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,32,balanced,0.3858773310979207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,32,balanced,0.3872426748275757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,32,balanced,0.38860801855723065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,32,balanced,0.38893866539001465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,32,balanced,0.39099733034769696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,32,balanced,0.3935573498408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,32,balanced,0.3944106499354045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,32,balanced,0.3978240092595418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,8,power_law_1.01,0.5816319942474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,32,balanced,0.4020906686782837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,32,balanced,0.408405343691508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,32,balanced,0.41523198286692303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,8,power_law_1.01,0.7837696075439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,32,balanced,0.4416853189468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,32,balanced,0.4541440010070801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,8,power_law_1.01,0.9684991836547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,32,balanced,0.4910080035527547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,32,balanced,0.48076800505320233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,8,power_law_1.01,1.006156826019287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,32,balanced,0.5449386835098267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,32,balanced,0.5819733142852783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,8,power_law_1.01,0.9973759651184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,32,balanced,0.7671466668446859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,8,power_law_1.01,1.144217586517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,32,balanced,0.8920746644337972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,8,power_law_1.01,1.1644927978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,32,balanced,1.2811946868896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,8,power_law_1.01,1.1964351654052734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,32,balanced,1.7309014002482097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,8,power_law_1.01,1.2802047729492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,8,power_law_1.01,1.2720128059387208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,8,power_law_1.01,1.2525376319885253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,8,power_law_1.01,1.2974080085754394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,8,power_law_1.01,1.2810239791870117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,8,power_law_1.01,1.3721599578857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,8,power_law_1.01,1.403059196472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,8,power_law_1.01,1.404313564300537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,8,power_law_1.01,1.4495743751525878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,8,power_law_1.01,1.5224512100219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,8,power_law_1.01,1.665407943725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,8,power_law_1.01,1.824563217163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,8,power_law_1.01,2.055129623413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,8,power_law_1.01,2.5055103302001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,8,power_law_1.01,3.301580810546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,8,power_law_1.01,5.0862079620361325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,8,power_law_1.01,5.178777694702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,8,power_law_1.01,6.816563415527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,8,power_law_1.01,9.626182556152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,64,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,64,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,64,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,64,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,64,balanced,0.04606399933497111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,64,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,64,balanced,0.2285226583480835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,64,balanced,0.23517866929372153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,64,balanced,0.23637332518895468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,64,balanced,0.23705599705378214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,64,balanced,0.2387626568476359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,64,balanced,0.24285866816838583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,64,balanced,0.24473599592844644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,64,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,64,balanced,0.2582186659177144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,64,balanced,0.26282666126887005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,64,balanced,0.27613866329193115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,64,balanced,0.2974720001220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,64,balanced,0.3203413287798564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,64,balanced,0.36522666613260907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,64,balanced,0.40994131565093994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,64,balanced,0.482474684715271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,64,balanced,0.5608106851577759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,64,balanced,0.7563947041829427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,64,balanced,0.9294506708780924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,64,balanced,1.295530637105306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,64,balanced,1.6981333096822102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,2,balanced,0.02882133424282074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,2,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,2,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,2,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,2,balanced,0.24539732933044434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,2,balanced,0.2486613392829895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,2,balanced,0.2500266631444295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,2,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,2,balanced,0.25668267409006756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,2,balanced,0.2585600018501282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,2,balanced,0.2629973292350769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,2,balanced,0.27084799607594806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,2,balanced,0.27357866366704303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,2,balanced,0.28142933050791424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,2,balanced,0.292687992254893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,2,balanced,0.3027519981066386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,2,balanced,0.3199999928474426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,2,balanced,0.3548053503036499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,2,balanced,0.3781973520914714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,2,balanced,0.43195732434590656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,2,balanced,0.5213866631189982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,2,balanced,0.7616853713989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,2,balanced,0.9804800351460775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,2,balanced,1.4701226552327473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,2,balanced,1.9039573669433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,2,balanced,2.911914825439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,2,balanced,3.9082667032877603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.09564160108566284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.214630389213562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.2531327962875366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.46919679641723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.47616000175476075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.49684481620788573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.4794367790222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.5019455909729004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.5042175769805908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.5085184097290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.5244927883148194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.5443583965301514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.5679103851318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.6043647766113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.7135231971740723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.7483136177062988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.9658368110656739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,1,power_law_1.01,1.2031999588012696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,8,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,8,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,8,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,8,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,8,balanced,0.2955946723620097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,8,balanced,0.5425493319829305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,8,balanced,0.5452800194422404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,8,balanced,0.5492053429285685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,8,balanced,0.5520960092544556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,8,balanced,0.5541546742121378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,8,balanced,0.5507413148880005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,8,balanced,0.5572266578674316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,8,balanced,0.5618346532185873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,8,balanced,0.5678079922993978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,8,balanced,0.5783893267313639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,8,balanced,0.5852160056432089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,8,balanced,0.605183998743693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,8,balanced,0.637440005938212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,8,balanced,0.6732800006866455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,8,balanced,0.731818675994873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,8,balanced,0.7883093357086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,1,power_law_1.01,1.704140853881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,8,balanced,0.9098239739735922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,8,balanced,1.0676906903584797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,8,balanced,1.4271146456400554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,1,power_law_1.01,2.246041679382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,8,balanced,1.8594133059183757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,8,balanced,2.606762727101644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,8,balanced,3.34062925974528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,1,power_law_1.01,3.28642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,1,power_law_1.01,4.288076782226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,32,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,32,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,32,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,32,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,32,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,32,power_law_1.2,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,32,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,32,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,32,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,32,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,32,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,32,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,32,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,32,power_law_1.2,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,32,power_law_1.2,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,32,power_law_1.2,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,32,power_law_1.2,0.10321919918060303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,32,power_law_1.2,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,32,power_law_1.2,0.16711679697036744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,32,power_law_1.2,0.2263040065765381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,32,power_law_1.2,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,32,power_law_1.2,0.5158912181854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,32,power_law_1.2,0.7528448104858398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,32,power_law_1.2,0.9805824279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,32,power_law_1.2,1.2759039878845215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,1,power_law_1.01,6.40184326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,32,power_law_1.2,2.2841344833374024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,2,power_law_1.2,0.3219264030456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,2,power_law_1.2,0.5382080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,2,power_law_1.2,0.7249919891357421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,2,power_law_1.2,1.1950079917907714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,2,power_law_1.2,1.7129472732543944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,2,power_law_1.2,2.2605823516845702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,2,power_law_1.2,2.98986873626709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,2,power_law_1.2,3.102079963684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,2,power_law_1.2,3.2649215698242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,2,power_law_1.2,3.2278270721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,2,power_law_1.2,3.214131164550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,2,power_law_1.2,3.4572288513183596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,2,power_law_1.2,3.5665920257568358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,2,power_law_1.2,3.743743896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,2,power_law_1.2,3.854937744140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,2,power_law_1.2,3.9047168731689452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,2,power_law_1.2,4.125900650024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,2,power_law_1.2,4.369203186035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,2,power_law_1.2,4.563737487792968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,2,power_law_1.2,4.931584167480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,2,power_law_1.2,5.392793655395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,2,power_law_1.2,5.961516952514648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,2,power_law_1.2,7.008870697021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,2,power_law_1.2,8.951602935791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,2,power_law_1.2,10.294681549072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,128,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,128,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,128,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,128,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,128,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,128,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,128,balanced,0.030879999200503033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,2,power_law_1.2,13.579661560058593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,128,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,128,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,128,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,128,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,128,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,128,balanced,0.03326933334271113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,128,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,128,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,128,balanced,0.041120000183582306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,128,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,128,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,128,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,128,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,128,balanced,0.05118933320045471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,128,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,128,balanced,0.0721919983625412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,128,balanced,0.130730668703715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,128,balanced,0.1991680065790812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,128,balanced,0.3418453137079875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,128,balanced,0.45158398151397705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,2,power_law_1.2,16.867123413085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,1,power_law_1.01,8.406221008300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,32,power_law_1.2,2.7650047302246095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,2,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,2,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,2,balanced,0.09335466225941975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,2,balanced,0.30907734235127765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,2,balanced,0.5782186587651571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,2,balanced,0.7038293679555258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,2,balanced,0.7098026275634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,2,balanced,0.7140693664550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,2,balanced,0.7207252979278564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,2,balanced,0.7239680290222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,2,balanced,0.7331786950429281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,2,balanced,0.7434240182240804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,2,balanced,0.7526400089263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,2,balanced,0.7705600261688232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,2,balanced,0.787285327911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,2,balanced,0.8060586452484131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,2,balanced,0.8436053593953451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,2,balanced,0.9154559771219889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,2,balanced,0.9792853196461996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,2,balanced,1.1395413080851238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,2,balanced,1.2875093619028728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,2,balanced,1.6677546501159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,2,balanced,1.9667627016703289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,2,balanced,2.639685312906901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,2,balanced,3.3693014780680337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,2,balanced,4.974762598673503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,2,balanced,6.45137087504069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,8,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,8,balanced,0.30822400252024335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,8,balanced,0.5874346494674683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,8,balanced,1.1354453563690186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,8,balanced,2.189141273498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,8,balanced,2.7769012451171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,8,balanced,2.781183878580729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,8,balanced,2.7335678736368814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,8,balanced,2.7390292485555015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,8,balanced,2.7431252797444663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,8,balanced,2.7487573623657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,8,balanced,2.758655865987142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,8,balanced,2.7700745264689126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,8,balanced,2.783914566040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,8,balanced,2.8078079223632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,8,balanced,2.894165356953939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,8,balanced,2.9105494817097983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,8,balanced,3.3563305536905923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,8,balanced,3.03496519724528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,8,balanced,3.4761387507120767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,8,balanced,3.6647040049235025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,8,balanced,4.162560145060222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,8,balanced,3.947861353556315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,8,balanced,4.874922752380371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,8,balanced,5.544448216756185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,8,balanced,7.385578791300456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,8,balanced,9.46343994140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,64,power_law_1.2,0.020479999482631683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,64,power_law_1.2,0.02149759978055954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,64,power_law_1.2,0.020070399343967437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,64,power_law_1.2,0.020275199413299562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,64,power_law_1.2,0.020684799551963805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,64,power_law_1.2,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,64,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,64,power_law_1.2,0.02537600100040436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,64,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,64,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,64,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,64,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,64,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,64,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,64,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,64,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,64,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,64,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,64,power_law_1.2,0.12943359613418579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,64,power_law_1.2,0.14561280012130737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,64,power_law_1.2,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,64,power_law_1.2,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,64,power_law_1.2,0.3436543941497803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,64,power_law_1.2,0.8554495811462403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,2,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,2,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,2,power_law_1.2,0.07495679855346679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,2,power_law_1.2,0.12595200538635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,2,power_law_1.2,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,2,power_law_1.2,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,2,power_law_1.2,0.41553921699523927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,2,power_law_1.2,0.44503040313720704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,2,power_law_1.2,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,2,power_law_1.2,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,2,power_law_1.2,0.4730879783630371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,2,power_law_1.2,0.5087232112884521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,2,power_law_1.2,0.5050367832183837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,2,power_law_1.2,0.5332992076873779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,2,power_law_1.2,0.5584896087646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,2,power_law_1.2,0.5924863815307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,2,power_law_1.2,0.6518784046173096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,2,power_law_1.2,0.75796480178833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,2,power_law_1.2,0.8185855865478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,2,power_law_1.2,1.0973183631896972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,2,power_law_1.2,1.2607423782348632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,64,power_law_1.2,0.9095168113708496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,2,power_law_1.2,1.7147903442382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,2,power_law_1.2,2.103091239929199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,2,power_law_1.2,3.0107648849487303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,2,power_law_1.2,3.930521774291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,2,power_law_1.2,5.506854248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,2,power_law_1.2,7.595417785644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,1,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,1,power_law_1.2,0.1921023964881897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,1,power_law_1.2,0.3729151964187622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,1,power_law_1.2,0.5251071929931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,1,power_law_1.2,0.7968768119812012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,1,power_law_1.2,1.431552028656006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,1,power_law_1.2,1.4815232276916503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,1,power_law_1.2,1.5679360389709474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,1,power_law_1.2,1.665433692932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,1,power_law_1.2,1.7096704483032226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,1,power_law_1.2,1.7616895675659179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,1,power_law_1.2,1.7931903839111327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,1,power_law_1.2,1.800396728515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,1,power_law_1.2,1.818623924255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,1,power_law_1.2,1.8771968841552735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,1,power_law_1.2,1.823923110961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,1,power_law_1.2,1.967308807373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,1,power_law_1.2,2.0434944152832033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,1,power_law_1.2,2.1528575897216795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,1,power_law_1.2,2.3729856491088865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,1,power_law_1.2,2.6062847137451173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,1,power_law_1.2,3.086131286621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,1,power_law_1.2,3.516620635986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,1,power_law_1.2,4.4746753692626955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,1,power_law_1.2,5.125734329223633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,1,power_law_1.2,7.016038513183593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,1,power_law_1.2,8.534425354003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,4,power_law_1.01,0.24821119308471679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,4,power_law_1.01,0.33075199127197263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,4,power_law_1.01,0.37601280212402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,4,power_law_1.01,0.4685823917388916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,4,power_law_1.01,0.46981120109558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,4,power_law_1.01,0.4753407955169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,4,power_law_1.01,0.542310380935669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,4,power_law_1.01,0.5293888092041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,4,power_law_1.01,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,4,power_law_1.01,0.5517055988311768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,4,power_law_1.01,0.6602752208709717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,4,power_law_1.01,0.6416384220123291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,4,power_law_1.01,0.7278592109680175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,4,power_law_1.01,0.683622407913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,4,power_law_1.01,0.7573503971099853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,4,power_law_1.01,0.8247296333312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,1,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,1,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,4,power_law_1.01,1.0266624450683595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,1,power_law_1.01,0.23203840255737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,4,power_law_1.01,1.1339776039123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,1,power_law_1.01,0.3551232099533081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,1,power_law_1.01,0.4468736171722412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,1,power_law_1.01,0.7325695991516114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,1,power_law_1.01,0.7788224220275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,1,power_law_1.01,0.8015872001647949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,4,power_law_1.01,1.3094911575317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,1,power_law_1.01,0.8407039642333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,1,power_law_1.01,0.8517631530761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,1,power_law_1.01,0.8738816261291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,1,power_law_1.01,0.8650752067565918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,1,power_law_1.01,0.88985595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,1,power_law_1.01,0.9121664047241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,1,power_law_1.01,0.9387711524963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,1,power_law_1.01,0.9324543952941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,1,power_law_1.01,0.9629376411437989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,4,power_law_1.01,1.7303552627563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,1,power_law_1.01,1.0049535751342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,1,power_law_1.01,1.0868736267089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,1,power_law_1.01,1.235968017578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,1,power_law_1.01,1.366598415374756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,1,power_law_1.01,1.7082368850708007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,4,power_law_1.01,2.588672065734863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,1,power_law_1.01,1.9382272720336915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,1,power_law_1.01,2.6271743774414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,1,power_law_1.01,3.2096256256103515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,1,power_law_1.01,4.615987014770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,1,power_law_1.01,6.147481536865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,4,power_law_1.01,3.0062591552734377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,4,power_law_1.01,3.504332733154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,8,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,8,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,8,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,8,power_law_1.2,0.06306560039520263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,8,power_law_1.2,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,8,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,8,power_law_1.2,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,8,power_law_1.2,0.06716160178184509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,8,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,8,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,8,power_law_1.2,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,8,power_law_1.2,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,8,power_law_1.2,0.08417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,8,power_law_1.2,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,8,power_law_1.2,0.09400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,8,power_law_1.2,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,8,power_law_1.2,0.14172159433364867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,8,power_law_1.2,0.1984511971473694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,8,power_law_1.2,0.208076810836792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,8,power_law_1.2,0.27463679313659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,8,power_law_1.2,0.3354624032974243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,8,power_law_1.2,0.6199295997619629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,4,power_law_1.01,5.185331344604492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,8,power_law_1.2,0.9365504264831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,8,power_law_1.2,1.5134719848632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,8,power_law_1.2,1.9564544677734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,8,power_law_1.2,3.0361600875854493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,8,power_law_1.2,4.242432022094727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,8,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,8,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,8,power_law_1.2,0.20049920082092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,8,power_law_1.2,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,8,power_law_1.2,0.3072000026702881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,8,power_law_1.2,0.3670016050338745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,8,power_law_1.2,0.39976959228515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,8,power_law_1.2,0.3268608093261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,4,power_law_1.01,6.9261314392089846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,8,power_law_1.2,0.32460799217224123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,8,power_law_1.2,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,8,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,8,power_law_1.2,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,8,power_law_1.2,0.3604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,8,power_law_1.2,0.35676159858703616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,8,power_law_1.2,0.394649600982666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,8,power_law_1.2,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,8,power_law_1.2,0.41349120140075685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,8,power_law_1.2,0.4476928234100342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,8,power_law_1.2,0.5054463863372802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,8,power_law_1.2,0.577945613861084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,8,power_law_1.2,0.6946688175201416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,8,power_law_1.2,0.9449472427368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,8,power_law_1.2,1.16244478225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,8,power_law_1.2,1.6433151245117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,8,power_law_1.2,2.1807104110717774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,8,power_law_1.2,3.136921691894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,8,power_law_1.2,4.206796646118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,4,power_law_1.01,11.867750549316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,16,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,16,power_law_1.2,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,16,power_law_1.2,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,16,power_law_1.2,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,16,power_law_1.2,0.260915207862854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,16,power_law_1.2,0.18653440475463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,16,power_law_1.2,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,16,power_law_1.2,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,16,power_law_1.2,0.23180160522460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,16,power_law_1.2,0.2564095973968506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,16,power_law_1.2,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,16,power_law_1.2,0.28097920417785643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,16,power_law_1.2,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,16,power_law_1.2,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,16,power_law_1.2,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,16,power_law_1.2,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,16,power_law_1.2,0.3110912084579468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,16,power_law_1.2,0.35000319480895997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,16,power_law_1.2,0.36761600971221925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,16,power_law_1.2,0.42597122192382814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,16,power_law_1.2,0.5015552043914795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,16,power_law_1.2,0.6660096168518066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,16,power_law_1.2,0.9494400024414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,16,power_law_1.2,1.364992046356201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,16,power_law_1.2,1.7727487564086915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,16,power_law_1.2,3.014246368408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,16,power_law_1.2,4.303667068481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,4,power_law_1.01,14.070783996582032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,8,power_law_1.01,0.2070528030395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,8,power_law_1.01,0.35921919345855713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,8,power_law_1.01,0.45424637794494627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,8,power_law_1.01,0.46919679641723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,8,power_law_1.01,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,8,power_law_1.01,0.5726208209991455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,8,power_law_1.01,0.6551551818847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,8,power_law_1.01,0.5744639873504639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,8,power_law_1.01,0.6082496166229248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,8,power_law_1.01,0.6223743915557861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,8,power_law_1.01,0.586956787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,8,power_law_1.01,0.596992015838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,8,power_law_1.01,0.6002687931060791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,8,power_law_1.01,0.6299456119537353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,8,power_law_1.01,0.6518720149993896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,8,power_law_1.01,0.6662144184112548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,8,power_law_1.01,0.658022403717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,8,power_law_1.01,0.6879231929779053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,8,power_law_1.01,0.728659200668335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,8,power_law_1.01,0.7931903839111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,8,power_law_1.01,0.8683520317077636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,8,power_law_1.01,0.9781120300292969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,8,power_law_1.01,1.1661312103271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,8,power_law_1.01,1.5921152114868165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,8,power_law_1.01,1.7156032562255858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,8,power_law_1.01,2.5001983642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,8,power_law_1.01,3.0773183822631838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,16,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,16,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,16,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,16,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,16,balanced,0.025754667818546295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,16,balanced,0.02644266684850057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,16,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,16,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,16,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,16,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,16,balanced,0.02796799937884013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,16,balanced,0.0284853329261144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,16,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,16,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,16,balanced,0.03155199935038885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,16,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,16,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,16,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,16,balanced,0.04348800083001455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,16,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,16,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,16,balanced,0.09110400080680847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,16,balanced,0.11417599519093831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,16,balanced,0.22459733486175537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,16,balanced,0.3027626673380534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,16,balanced,0.4466346502304077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,16,balanced,0.5884586572647095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,2,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,2,power_law_1.01,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,2,power_law_1.01,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,2,power_law_1.01,0.20193281173706054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,2,power_law_1.01,0.30556159019470214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,2,power_law_1.01,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,2,power_law_1.01,0.466534423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,2,power_law_1.01,0.6139904022216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,2,power_law_1.01,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,2,power_law_1.01,0.6100992202758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,2,power_law_1.01,0.6459263801574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,2,power_law_1.01,0.6856704235076905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,2,power_law_1.01,0.6832128047943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,2,power_law_1.01,0.7165952205657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,2,power_law_1.01,0.7903232097625732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,2,power_law_1.01,0.8011775970458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,2,power_law_1.01,0.8437760353088379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,2,power_law_1.01,0.9367551803588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,2,power_law_1.01,1.0629119873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,2,power_law_1.01,1.319321632385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,2,power_law_1.01,1.6064512252807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,2,power_law_1.01,2.0674560546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,2,power_law_1.01,2.6116096496582033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,2,power_law_1.01,3.688243103027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,2,power_law_1.01,4.9209342956542965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,2,power_law_1.01,6.96258544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,2,power_law_1.01,8.987852478027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,16,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,16,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,16,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,16,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,16,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,16,power_law_1.2,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,16,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,16,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,16,power_law_1.2,0.02720000147819519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,16,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,16,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,16,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,16,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,16,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,16,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,16,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,16,power_law_1.2,0.05507199764251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,16,power_law_1.2,0.06450560092926025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,16,power_law_1.2,0.07677440047264099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,16,power_law_1.2,0.0972544014453888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,16,power_law_1.2,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,16,power_law_1.2,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,16,power_law_1.2,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,1,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,1,power_law_1.2,0.3014656066894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,1,power_law_1.2,0.5341184139251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,1,power_law_1.2,0.913203239440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,1,power_law_1.2,1.436467170715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,1,power_law_1.2,1.8176000595092774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,1,power_law_1.2,2.8692480087280274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,1,power_law_1.2,2.9906944274902343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,1,power_law_1.2,3.123404884338379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,1,power_law_1.2,3.2040958404541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,1,power_law_1.2,3.366502380371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,1,power_law_1.2,3.3421310424804687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,1,power_law_1.2,3.5436542510986326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,16,power_law_1.2,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,1,power_law_1.2,3.6720638275146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,1,power_law_1.2,3.836518478393555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,1,power_law_1.2,3.905331039428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,1,power_law_1.2,4.0947521209716795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,1,power_law_1.2,4.3450366973876955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,1,power_law_1.2,4.614963150024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,1,power_law_1.2,4.975001525878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,16,power_law_1.2,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,1,power_law_1.2,5.39238395690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,1,power_law_1.2,6.116966247558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,1,power_law_1.2,7.420108795166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,1,power_law_1.2,9.474457550048829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,1,power_law_1.2,10.855833435058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,1,power_law_1.2,15.112588500976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,1,power_law_1.2,18.102476501464842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,16,power_law_1.2,0.9406463623046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,16,power_law_1.2,1.3967295646667481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,32,power_law_1.01,1.060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,32,power_law_1.01,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,32,power_law_1.01,1.0547200202941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,32,power_law_1.01,1.0547200202941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,32,power_law_1.01,1.0082304000854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,32,power_law_1.01,0.7555071830749511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,32,power_law_1.01,0.8613887786865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,32,power_law_1.01,1.0057727813720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,32,power_law_1.01,1.034444808959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,32,power_law_1.01,1.0373120307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,32,power_law_1.01,0.9660415649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,32,power_law_1.01,1.0711039543151855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,32,power_law_1.01,1.054310417175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,32,power_law_1.01,1.0827775955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,32,power_law_1.01,1.1237312316894532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,32,power_law_1.01,1.1165696144104005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,32,power_law_1.01,1.0680319786071777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,32,power_law_1.01,1.2101632118225099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,32,power_law_1.01,1.2781567573547363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,32,power_law_1.01,1.4006272315979005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,32,power_law_1.01,1.5781888008117675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,32,power_law_1.01,1.847091293334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,32,power_law_1.01,2.573516845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,32,power_law_1.01,3.5145729064941404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,32,power_law_1.01,3.7607425689697265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,32,power_law_1.01,5.100339126586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,32,power_law_1.01,6.747341156005859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,4,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,4,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,4,balanced,0.07798933486143748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,4,balanced,0.30481066306432086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,4,balanced,0.5896533330281576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,4,balanced,0.7287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,4,balanced,0.7328426837921143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,4,balanced,0.7304533322652181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,4,balanced,0.7336906592051188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,4,balanced,0.736255963643392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,4,balanced,0.7417173385620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,4,balanced,0.7471786340077718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,4,balanced,0.7519573370615641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,4,balanced,0.7621973355611166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,4,balanced,0.773973306020101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,4,balanced,0.8087733586629232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,4,balanced,0.8178186416625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,4,balanced,0.8550399939219157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,4,balanced,0.904533306757609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,4,balanced,0.971776008605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,4,balanced,1.0584746996561687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,4,balanced,1.3199360370635986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,4,balanced,1.5831039746602376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,4,balanced,2.14630397160848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,4,balanced,2.6424320538838706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,4,balanced,3.7452799479166665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,4,balanced,4.846591949462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,16,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,16,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,16,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,16,balanced,0.29201066493988037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,16,balanced,0.5396480162938436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,16,balanced,1.0313173135121663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,16,balanced,1.5206185976664226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,16,balanced,1.5269546508789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,16,balanced,1.528831958770752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,16,balanced,1.5303680102030437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,16,balanced,1.536512056986491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,16,balanced,1.5438507397969563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,16,balanced,1.546240011850993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,16,balanced,1.557674725850423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,16,balanced,1.5706453323364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,16,balanced,1.5788373947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,16,balanced,1.5998293558756511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,16,balanced,1.6302080154418945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,16,balanced,1.666218598683675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,16,balanced,1.7339413960774739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,16,balanced,1.793706734975179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,16,balanced,1.925103982289632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,16,balanced,2.0302507082621255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,16,balanced,2.295466740926107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,16,balanced,2.599936008453369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,16,balanced,3.2870400746663413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,16,balanced,4.033535957336426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,4,balanced,0.31112533807754517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,4,balanced,0.5387946764628092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,4,balanced,1.055573304494222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,4,balanced,2.07479461034139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,4,balanced,4.178943951924642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,4,balanced,7.984629313151042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,4,balanced,11.959978739420572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,4,balanced,11.955711364746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,4,balanced,11.962880452473959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,4,balanced,11.976362864176432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,4,balanced,12.140543619791666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,4,balanced,12.152661641438803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,4,balanced,12.172964731852213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,4,balanced,12.084885915120443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,4,balanced,12.110677083333334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,4,balanced,12.116458892822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,4,balanced,12.18167495727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,4,balanced,12.312063852945963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,4,balanced,12.761941274007162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,4,balanced,13.019648234049479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,2,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,2,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,2,balanced,0.24541866779327393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,2,balanced,0.4599466721216838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,4,balanced,13.307562510172525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,2,balanced,0.8773972988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,2,balanced,0.879957358042399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,2,balanced,0.8852480252583822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,2,balanced,0.8905386924743652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,2,balanced,0.8944640159606934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,2,balanced,0.899072011311849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,2,balanced,0.9065813223520914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,2,balanced,0.9149440129597982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,2,balanced,0.923962672551473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,2,balanced,0.9376426537831625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,2,balanced,0.9533440272013346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,2,balanced,0.9686773618062338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,4,balanced,13.758463541666666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,2,balanced,1.0018080075581868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,2,balanced,1.0584746996561687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,2,balanced,1.1187199751536052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,2,balanced,1.193984031677246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,2,balanced,1.3095253308614094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,2,balanced,1.5701066652933757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,2,balanced,1.8109439214070637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,4,balanced,15.988906860351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,2,balanced,2.3369386990865073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,2,balanced,2.9264214833577475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,2,balanced,4.274346669514974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,2,balanced,5.691551844278972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,4,balanced,17.080149332682293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,4,balanced,17.306453704833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,4,balanced,19.88915252685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,16,power_law_1.01,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,16,power_law_1.01,0.22035200595855714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,16,power_law_1.01,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,16,power_law_1.01,0.19886080026626587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,16,power_law_1.01,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,16,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,16,power_law_1.01,0.232857608795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,16,power_law_1.01,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,16,power_law_1.01,0.24145278930664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,16,power_law_1.01,0.23019518852233886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,16,power_law_1.01,0.25866239070892333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,16,power_law_1.01,0.24965119361877441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,16,power_law_1.01,0.26296319961547854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,16,power_law_1.01,0.2703360080718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,16,power_law_1.01,0.266431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,4,balanced,20.306772867838543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,16,power_law_1.01,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,16,power_law_1.01,0.2758656024932861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,16,power_law_1.01,0.2973695993423462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,16,power_law_1.01,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,16,power_law_1.01,0.3852288007736206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,16,power_law_1.01,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,16,power_law_1.01,0.5922815799713135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,16,power_law_1.01,0.7065599918365478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,16,power_law_1.01,1.0215423583984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,16,power_law_1.01,1.4653440475463868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,16,power_law_1.01,2.3998464584350585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,16,power_law_1.01,3.4383872985839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,4,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,4,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,4,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,4,balanced,0.04111466556787491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,4,balanced,0.13294933239618936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,4,balanced,0.3500373363494873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,4,balanced,0.35037867228190106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,4,balanced,0.35310932000478107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,4,balanced,0.3542933464050293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,4,balanced,0.3547999858856201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,4,balanced,0.35703468322753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,4,balanced,0.3601066668828328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,4,balanced,0.36300798257191974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,4,balanced,0.3671040137608846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,4,balanced,0.3742719888687134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,4,balanced,0.3985066811243693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,4,balanced,0.39321601390838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,4,balanced,0.4121599992116292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,4,balanced,0.43025068442026776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,4,balanced,0.4505600134531657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,4,balanced,0.4925440152486165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,4,balanced,0.5831679900487264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,4,balanced,0.6802773475646973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,4,balanced,0.9787733554840088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,4,balanced,1.250986655553182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,4,balanced,1.7940479914347331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,4,balanced,2.32806396484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,32,power_law_1.01,0.5990399837493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,32,power_law_1.01,0.5386240005493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,32,power_law_1.01,0.5582848072052002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,32,power_law_1.01,0.5445631980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,32,power_law_1.01,0.4956160068511963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,32,power_law_1.01,0.411846399307251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,32,power_law_1.01,0.5130239963531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,32,power_law_1.01,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,32,power_law_1.01,0.5240831851959229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,32,power_law_1.01,0.5253119945526123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,32,power_law_1.01,0.46735358238220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,32,power_law_1.01,0.5089280128479003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,32,power_law_1.01,0.5510975837707519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,32,power_law_1.01,0.4947968006134033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,32,power_law_1.01,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,32,power_law_1.01,0.5814271926879883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,32,power_law_1.01,0.5746687889099121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,32,power_law_1.01,0.601087999343872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,32,power_law_1.01,0.6733503818511963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,32,power_law_1.01,0.734822416305542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,32,power_law_1.01,0.8658623695373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,32,power_law_1.01,1.0651519775390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,32,power_law_1.01,1.315225601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,32,power_law_1.01,1.7772544860839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,32,power_law_1.01,2.274297523498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,32,power_law_1.01,3.2143360137939454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,32,power_law_1.01,4.704051208496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,64,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,64,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,64,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,64,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,64,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,64,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,64,power_law_1.01,0.0315200001001358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,64,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,64,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,64,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,64,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,64,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,64,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,64,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,64,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,64,power_law_1.01,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,64,power_law_1.01,0.14561280012130737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,64,power_law_1.01,0.16097279787063598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,64,power_law_1.01,0.2002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,64,power_law_1.01,0.24576001167297362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,64,power_law_1.01,0.3919872045516968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,64,power_law_1.01,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,64,power_law_1.01,0.8417280197143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,64,power_law_1.01,0.9955327987670899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,16,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,16,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,16,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,16,balanced,0.169813334941864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,16,balanced,0.353279987970988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,16,balanced,0.6754986445109049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,16,balanced,0.6780587037404379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,16,balanced,0.6731093724568685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,16,balanced,0.6753280162811279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,16,balanced,0.6758399804433187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,16,balanced,0.6780587037404379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,16,balanced,0.6816426912943522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,16,balanced,0.683690627415975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,16,balanced,0.6876160303751627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,16,balanced,0.694271961847941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,16,balanced,0.6980266571044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,16,balanced,0.7140693664550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,16,balanced,0.7313066323598226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,16,balanced,0.7473493417104086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,16,balanced,0.7393279870351156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,16,balanced,0.7755093574523926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,16,balanced,0.8386560281117758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,16,balanced,0.8830293019612631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,16,balanced,1.0059093634287517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,16,balanced,1.0873173077901204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,16,balanced,1.4071466128031414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,16,balanced,1.799850622812907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,64,power_law_1.01,0.03028480112552643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,64,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,64,power_law_1.01,0.02988159954547882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,64,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,64,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,64,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,64,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,64,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,64,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,64,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,64,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,64,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,64,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,64,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,64,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,64,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,64,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,64,power_law_1.01,0.09953280091285706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,64,power_law_1.01,0.1412992000579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,64,power_law_1.01,0.1978368043899536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,64,power_law_1.01,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,64,power_law_1.01,0.45137920379638674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,64,power_law_1.01,0.6148096084594726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,64,power_law_1.01,0.9457663536071778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,64,power_law_1.01,1.427455997467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,64,power_law_1.01,1.8339839935302735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,128,power_law_1.2,0.46141438484191893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,128,power_law_1.2,0.41594882011413575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,128,power_law_1.2,0.41656317710876467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,128,power_law_1.2,0.41656317710876467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,128,power_law_1.2,0.36618239879608155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,128,power_law_1.2,0.39628798961639405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,128,power_law_1.2,0.37068800926208495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,128,power_law_1.2,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,128,power_law_1.2,0.42598400115966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,128,power_law_1.2,0.4009856224060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,128,power_law_1.2,0.37662720680236816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,128,power_law_1.2,0.4069375991821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,128,power_law_1.2,0.38338561058044435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,128,power_law_1.2,0.43662080764770506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,128,power_law_1.2,0.4616191864013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,128,power_law_1.2,0.45608959197998045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,128,power_law_1.2,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,128,power_law_1.2,0.49848318099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,128,power_law_1.2,0.5165056228637696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,128,power_law_1.2,0.8316927909851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,128,power_law_1.2,0.8671232223510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,128,power_law_1.2,1.2543999671936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,128,power_law_1.2,1.5798272132873534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,128,power_law_1.2,2.3148544311523436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,128,power_law_1.2,3.321241760253906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,128,power_law_1.2,5.498470306396484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,128,power_law_1.2,7.368294525146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,256,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,256,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,256,balanced,0.03853866706291834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,256,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,256,balanced,0.038890667259693146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,256,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,256,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,256,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,256,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,256,balanced,0.041120000183582306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,256,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,256,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,256,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,256,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,256,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,256,balanced,0.04741866886615753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,256,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,256,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,256,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,256,balanced,0.06690133114655812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,256,balanced,0.07574933270613353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,256,balanced,0.09181867043177287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,256,balanced,0.11076266566912334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,256,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,256,balanced,0.3324586749076843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,256,balanced,0.49322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,256,balanced,0.6541653474171957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.30945279598236086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,16,power_law_1.01,0.025388801097869874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.5912576198577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,16,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,16,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.9623552322387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,16,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,16,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,1,power_law_1.01,1.3334527969360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,16,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,16,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,16,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,16,power_law_1.01,0.02515200078487396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,1,power_law_1.01,2.166579246520996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,16,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,16,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,16,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,1,power_law_1.01,2.3476224899291993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,16,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,16,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,16,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,16,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,1,power_law_1.01,2.367283248901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,16,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,16,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,16,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,1,power_law_1.01,2.4479743957519533
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,16,power_law_1.01,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,16,power_law_1.01,0.07696639895439147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,16,power_law_1.01,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,1,power_law_1.01,2.510643196105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,16,power_law_1.01,0.15646719932556152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,16,power_law_1.01,0.2732032060623169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,1,power_law_1.01,2.615500831604004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,16,power_law_1.01,0.38543360233306884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,16,power_law_1.01,0.5371903896331787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,1,power_law_1.01,2.73305606842041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,16,power_law_1.01,0.8441856384277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,1,power_law_1.01,2.6968063354492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,1,power_law_1.01,2.8438528060913084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,1,power_law_1.01,2.9313024520874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,1,power_law_1.01,2.939494323730469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,1,power_law_1.01,3.1072256088256838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,1,power_law_1.01,3.2901119232177733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,1,power_law_1.01,3.4414592742919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,1,power_law_1.01,3.888947296142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,1,power_law_1.01,4.128358459472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,1,power_law_1.01,5.067366409301758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,1,power_law_1.01,6.107750320434571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,1,power_law_1.01,8.254259490966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,1,power_law_1.01,9.583821105957032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,1,power_law_1.01,13.626777648925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,1,power_law_1.01,17.75308837890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,8,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,8,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,8,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,8,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,8,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,8,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,8,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,8,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,8,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,8,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,8,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,8,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,8,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,8,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,8,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,8,balanced,0.06519466638565063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,8,balanced,0.06963199873765309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,8,balanced,0.0791786660750707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,8,balanced,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,8,balanced,0.23091200987497965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,8,balanced,0.29286400477091473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,8,balanced,0.40174933274586994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,8,balanced,0.5544960101445516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,8,balanced,0.9021440347035726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,8,balanced,1.2503039836883545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,8,balanced,1.9553279876708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,8,balanced,2.715989430745443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,16,power_law_1.2,0.3590143918991089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,16,power_law_1.2,0.6520832061767579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,16,power_law_1.2,0.6225920200347901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,16,power_law_1.2,0.5953536033630371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,1,power_law_1.2,1.0307583808898926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,16,power_law_1.2,0.6465536117553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,1,power_law_1.2,1.735647964477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,16,power_law_1.2,0.5132287979125977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,1,power_law_1.2,2.55098876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,16,power_law_1.2,0.5982207775115966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,16,power_law_1.2,0.6094848155975342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,16,power_law_1.2,0.6260608196258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,1,power_law_1.2,3.855769729614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,16,power_law_1.2,0.5781504154205322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,16,power_law_1.2,0.631603193283081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,1,power_law_1.2,4.068966293334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,16,power_law_1.2,0.6201344013214112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,16,power_law_1.2,0.6072319984436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,16,power_law_1.2,0.5943295955657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,1,power_law_1.2,4.089440155029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,16,power_law_1.2,0.6076416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,16,power_law_1.2,0.6543231964111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,16,power_law_1.2,0.668671989440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,1,power_law_1.2,4.435148620605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,16,power_law_1.2,0.7360511779785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,16,power_law_1.2,0.7673855781555176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,16,power_law_1.2,0.879206371307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,1,power_law_1.2,4.630118560791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,16,power_law_1.2,0.9891839981079101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,16,power_law_1.2,1.3834176063537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,1,power_law_1.2,5.04791030883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,16,power_law_1.2,1.396326446533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,16,power_law_1.2,2.0307968139648436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,1,power_law_1.2,5.201907348632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,16,power_law_1.2,2.121932792663574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,1,power_law_1.2,4.7771648406982425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,16,power_law_1.2,3.6507648468017577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,1,power_law_1.2,5.144166564941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,16,power_law_1.2,4.811775970458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,1,power_law_1.2,5.390745544433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,1,power_law_1.2,5.901516723632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,1,power_law_1.2,6.718463897705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,1,power_law_1.2,7.122930908203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,1,power_law_1.2,8.334336090087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,1,power_law_1.2,10.384140777587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,1,power_law_1.2,12.249088287353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,4,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,4,power_law_1.2,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,4,power_law_1.2,0.15421439409255983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,4,power_law_1.2,0.2883519887924194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,4,power_law_1.2,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,4,power_law_1.2,0.41736321449279784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,4,power_law_1.2,0.44072961807250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,4,power_law_1.2,0.44072961807250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,4,power_law_1.2,0.45608959197998045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,4,power_law_1.2,0.46099200248718264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,4,power_law_1.2,0.47083520889282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,4,power_law_1.2,0.4597760200500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,4,power_law_1.2,0.48353281021118166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,4,power_law_1.2,0.4827136039733887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,4,power_law_1.2,0.49786877632141113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,4,power_law_1.2,0.5091328144073486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,4,power_law_1.2,0.5083136081695556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,4,power_law_1.2,0.5855231761932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,4,power_law_1.2,0.6242303848266602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,1,power_law_1.2,14.629273986816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,4,power_law_1.2,0.728652811050415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,4,power_law_1.2,0.8353535652160644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,4,power_law_1.2,1.100595188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,4,power_law_1.2,1.3323967933654786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,1,power_law_1.2,16.741990661621095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,4,power_law_1.2,1.8262016296386718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,1,power_law_1.2,20.367768859863283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,4,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,4,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,4,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,4,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,4,balanced,0.14899200201034546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,4,balanced,0.3572053511937459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,4,balanced,0.3590826590855916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,4,balanced,0.36181334654490155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,4,balanced,0.3633493185043335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,4,balanced,0.36403199036916095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,4,balanced,0.3653973340988159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,4,balanced,0.3703306516011556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,4,balanced,0.37307735284169513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,4,balanced,0.37852799892425537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,4,balanced,0.385535995165507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,4,balanced,0.39048532644907635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,4,balanced,0.4005546569824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,4,balanced,0.4227413336435954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,4,balanced,0.44544001420338947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,4,balanced,0.4864000082015991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,4,power_law_1.2,2.4336383819580076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,4,balanced,0.5331626733144125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,4,balanced,0.6116693417231241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,4,balanced,0.6930773258209229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,4,balanced,0.92194135983785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,4,balanced,1.1653119723002117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,4,balanced,1.6558079719543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,4,balanced,2.21781333287557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,1,power_law_1.2,24.253439331054686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,4,power_law_1.2,3.4115585327148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,1,power_law_1.2,31.506021118164064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,1,power_law_1.2,37.720883178710935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,64,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,64,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,64,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,64,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,64,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,64,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,64,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,64,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,64,balanced,0.0260959987839063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,64,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,64,balanced,0.026421333352724712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,64,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,64,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,64,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,64,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,64,balanced,0.031541332602500916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,64,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,64,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,64,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,64,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,64,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,64,balanced,0.05919999877611796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,64,balanced,0.07388799885908763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,64,balanced,0.1609386702378591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,64,balanced,0.2187946637471517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,4,balanced,0.5290613174438477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,4,balanced,0.4734293222427368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,4,balanced,0.9067520300547282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,4,balanced,0.912554661432902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,4,balanced,0.9096533457438151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,4,balanced,0.9156266848246256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,4,balanced,0.9200639724731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,4,balanced,0.9216000239054362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,4,balanced,0.9425919850667318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,4,balanced,0.9448106288909912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,4,balanced,0.9524906476338705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,4,balanced,0.9642666975657145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,4,balanced,0.966485341389974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,4,balanced,0.9854293664296468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,4,balanced,1.4936693509419758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,4,balanced,1.5211520195007324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,4,balanced,1.682597319285075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,4,balanced,2.1558507283528647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,4,balanced,2.8183892567952475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,4,balanced,3.783151944478353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,4,balanced,4.666703859965007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,4,balanced,5.7864532470703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,4,balanced,6.928042729695638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,4,balanced,8.713045120239258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,4,balanced,10.378069559733072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,4,balanced,13.573973337809244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,4,balanced,16.652266184488933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,4,power_law_1.2,4.841267013549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,1,power_law_1.2,51.662420654296874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,64,power_law_1.2,0.799948787689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,64,power_law_1.2,0.799129581451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,64,power_law_1.2,0.8050496101379394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,64,power_law_1.2,0.7995391845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,64,power_law_1.2,0.7505919933319092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,64,power_law_1.2,0.6809599876403809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,64,power_law_1.2,0.5531648159027099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,64,power_law_1.2,0.6555647850036621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,64,power_law_1.2,0.6834176063537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,64,power_law_1.2,0.7358463764190674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,64,power_law_1.2,0.7124991893768311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,64,power_law_1.2,0.7921664237976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,64,power_law_1.2,0.7938047885894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,64,power_law_1.2,0.7526400089263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,64,power_law_1.2,0.7708608150482178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,64,power_law_1.2,0.8185855865478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,64,power_law_1.2,0.9531392097473145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,64,power_law_1.2,0.8531968116760253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,64,power_law_1.2,0.9021439552307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,64,power_law_1.2,1.1735039710998536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,64,power_law_1.2,1.2378111839294434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,64,power_law_1.2,1.5384575843811035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,64,power_law_1.2,1.9107839584350585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,64,power_law_1.2,2.733875274658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,64,power_law_1.2,4.0454143524169925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,64,power_law_1.2,5.843148803710937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,64,power_law_1.2,6.014566421508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,1,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,1,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,1,power_law_1.01,0.2910207986831665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,1,power_law_1.01,0.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,1,power_law_1.01,0.8022015571594239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,1,power_law_1.01,1.0682368278503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,1,power_law_1.01,1.4508031845092773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,1,power_law_1.01,1.5327232360839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,1,power_law_1.01,1.6486400604248046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,1,power_law_1.01,1.664614486694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,1,power_law_1.01,1.7207296371459961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,1,power_law_1.01,1.7793024063110352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,1,power_law_1.01,1.8507776260375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,1,power_law_1.01,1.9224576950073242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,1,power_law_1.01,1.968320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,1,power_law_1.2,64.80117797851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,1,power_law_1.01,2.0174848556518556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,1,power_law_1.01,2.106982421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,1,power_law_1.01,2.3420927047729494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,1,power_law_1.01,2.5257984161376954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,1,power_law_1.01,2.891366386413574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,1,power_law_1.01,3.3126399993896483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,1,power_law_1.01,3.971481704711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,1,power_law_1.01,4.713676834106446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,1,power_law_1.01,6.219980621337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,1,power_law_1.01,7.5284477233886715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,1,power_law_1.01,10.699366760253906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,8,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,8,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,8,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,8,balanced,0.24797866741816202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,8,balanced,0.45892266432444256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,8,balanced,0.4608000119527181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,8,balanced,0.4621653159459432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,8,balanced,0.4648960034052531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,8,balanced,0.4659200112024943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,8,balanced,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,8,balanced,0.4626773198445638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,8,balanced,0.4648960034052531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,8,balanced,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,8,balanced,0.4751360019048055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,8,balanced,0.4814506769180298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,8,balanced,0.48793598016103107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,8,balanced,0.5053439935048422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,8,balanced,0.5256533225377401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,8,balanced,0.5454506476720175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,8,balanced,0.5703573226928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,8,balanced,0.6150826613108317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,8,balanced,0.688810666402181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,8,balanced,0.7819946606953939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,1,power_law_1.01,13.791845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,8,balanced,1.0412373542785645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,8,balanced,1.3165226777394612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,8,balanced,1.9822932879130046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,8,balanced,2.70796807607015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,16,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,16,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,16,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,16,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,16,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,16,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,16,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,16,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,16,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,16,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,16,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,16,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,16,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,16,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,16,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,16,power_law_1.2,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,16,power_law_1.2,0.1171455979347229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,16,power_law_1.2,0.17059839963912965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,16,power_law_1.2,0.25395200252532957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,16,power_law_1.2,0.2977792024612427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,16,power_law_1.2,0.46242561340332033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,16,power_law_1.2,0.5943295955657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,16,power_law_1.2,1.0110976219177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,16,power_law_1.2,1.1909119606018066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,8,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,8,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,8,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,8,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,8,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,8,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,8,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,8,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,8,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,8,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,8,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,8,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,8,balanced,0.08618666728337605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,8,balanced,0.0988159974416097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,8,balanced,0.11211199561754863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,8,balanced,0.1628159979979197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,8,balanced,0.22323199113210043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,8,balanced,0.2986666758855184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,8,balanced,0.3717120091120402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,8,balanced,0.5239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,8,balanced,0.6679893334706625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,8,balanced,1.0023252964019775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,8,balanced,1.358847935994466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,8,balanced,2.0188159942626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,8,balanced,2.709674517313639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,64,power_law_1.01,0.6006783962249755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,64,power_law_1.01,0.5406720161437988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,64,power_law_1.01,0.5404672145843505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,64,power_law_1.01,0.5416959762573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,64,power_law_1.01,0.46755199432373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,64,power_law_1.01,0.497049617767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,64,power_law_1.01,0.5242879867553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,64,power_law_1.01,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,64,power_law_1.01,0.5527552127838135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,64,power_law_1.01,0.5285888195037842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,64,power_law_1.01,0.48289918899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,64,power_law_1.01,0.5122047901153565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,64,power_law_1.01,0.5140223979949952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,64,power_law_1.01,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,64,power_law_1.01,0.597811222076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,64,power_law_1.01,0.6074368000030518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,64,power_law_1.01,0.5791744232177735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,64,power_law_1.01,0.6813695907592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,64,power_law_1.01,0.748524808883667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,64,power_law_1.01,0.8278016090393067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,64,power_law_1.01,1.195622444152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,64,power_law_1.01,1.4338047981262207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,16,power_law_1.2,2.147327995300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,64,power_law_1.01,1.7903615951538085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,64,power_law_1.01,2.4832000732421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,64,power_law_1.01,3.2847873687744142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,64,power_law_1.01,6.03873291015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,64,power_law_1.01,6.729933166503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,8,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,8,power_law_1.2,0.17589759826660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,8,power_law_1.2,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,8,power_law_1.2,0.2988032102584839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,8,power_law_1.2,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,8,power_law_1.2,0.33402879238128663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,8,power_law_1.2,0.32604160308837893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,8,power_law_1.2,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,8,power_law_1.2,0.3831423997879028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,8,power_law_1.2,0.342630410194397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,8,power_law_1.2,0.3889152050018311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,8,power_law_1.2,0.3841856002807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,8,power_law_1.2,0.38338561058044435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,8,power_law_1.2,0.393830394744873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,8,power_law_1.2,0.4069119930267334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,8,power_law_1.2,0.4325376033782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,8,power_law_1.2,0.4429823875427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,8,power_law_1.2,0.48619518280029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,8,power_law_1.2,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,8,power_law_1.2,0.5941247940063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,8,power_law_1.2,0.668671989440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,8,power_law_1.2,0.9848832130432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,16,power_law_1.2,2.7437055587768553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,8,power_law_1.2,1.3696640014648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,8,power_law_1.2,1.8829311370849608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,8,power_law_1.2,2.4377344131469725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,8,power_law_1.2,3.7238784790039063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,8,power_law_1.2,4.85847053527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,2,balanced,0.067071999112765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,2,balanced,0.2940586606661479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,2,balanced,0.5331626733144125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,2,balanced,1.032533327738444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,2,balanced,2.065066655476888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,2,balanced,3.9843839009602866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,2,balanced,5.948757171630859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,2,balanced,5.961045583089192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,2,balanced,5.977429072062175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,2,balanced,5.987669626871745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,2,balanced,6.014293034871419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,2,balanced,6.037845611572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,2,balanced,6.059349060058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,2,balanced,6.0997975667317705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,2,balanced,6.137343724568685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,2,balanced,6.188032150268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,2,balanced,6.240421295166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,2,balanced,6.3648427327473955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,2,balanced,6.48089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,2,balanced,6.718634923299153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,2,balanced,6.9447682698567705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,2,balanced,7.432533264160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,2,balanced,7.7965653737386065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,2,balanced,8.679936091105143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,2,balanced,9.42079989115397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,2,balanced,11.390975952148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,2,balanced,13.951146443684896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,1,power_law_1.01,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,1,power_law_1.01,0.3637248039245605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,1,power_law_1.01,0.6653759956359864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,1,power_law_1.01,1.3039487838745116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,1,power_law_1.01,1.9687423706054688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,1,power_law_1.01,2.6091520309448244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,1,power_law_1.01,3.667148971557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,1,power_law_1.01,3.8961151123046873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,1,power_law_1.01,3.9743488311767576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,1,power_law_1.01,4.069990539550782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,1,power_law_1.01,4.20392951965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,128,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,128,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,128,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,128,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,128,power_law_1.01,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,1,power_law_1.01,4.324761581420899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,128,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,128,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,128,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,128,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,128,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,128,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,128,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,1,power_law_1.01,4.460134506225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,128,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,128,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,128,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,128,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,128,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,128,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,1,power_law_1.01,4.621311950683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,128,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,128,power_law_1.01,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,128,power_law_1.01,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,128,power_law_1.01,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,128,power_law_1.01,0.12779519557952881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,1,power_law_1.01,4.65162239074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,128,power_law_1.01,0.2052095890045166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,128,power_law_1.01,0.33669118881225585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,128,power_law_1.01,0.5199872016906738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,1,power_law_1.01,4.790886306762696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,128,power_law_1.01,0.7211008071899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,1,power_law_1.01,4.860313415527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,1,power_law_1.01,5.124095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,1,power_law_1.01,5.111808013916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,1,power_law_1.01,5.4335487365722654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,1,power_law_1.01,5.797068786621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,1,power_law_1.01,6.5603584289550785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,1,power_law_1.01,7.353753662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,1,power_law_1.01,8.90490264892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,1,power_law_1.01,9.770598602294921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,1,power_law_1.01,13.033062744140626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,1,power_law_1.01,16.348979187011718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,4,power_law_1.2,0.7555071830749511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,4,power_law_1.2,1.1180031776428223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,4,power_law_1.2,1.5843328475952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,4,power_law_1.2,2.1325824737548826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,4,power_law_1.2,2.5732927322387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,4,power_law_1.2,3.7621761322021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,4,power_law_1.2,3.5913726806640627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,4,power_law_1.2,3.7117950439453127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,4,power_law_1.2,3.500646209716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,4,power_law_1.2,3.751116943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,4,power_law_1.2,3.688243103027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,4,power_law_1.2,3.9577598571777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,4,power_law_1.2,4.016128158569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,4,power_law_1.2,4.029811096191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,4,power_law_1.2,4.281958389282226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,4,power_law_1.2,4.261478424072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,4,power_law_1.2,4.442521667480468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,4,power_law_1.2,4.314316940307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,4,power_law_1.2,4.626220703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,4,power_law_1.2,4.949196624755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,4,power_law_1.2,5.618892669677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,4,power_law_1.2,6.8878334045410154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,4,power_law_1.2,7.096934509277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,4,power_law_1.2,9.464627075195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,2,power_law_1.2,0.44359679222106935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,2,power_law_1.2,0.6766592025756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,2,power_law_1.2,0.6768640041351318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,2,power_law_1.2,1.0328000068664551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,2,power_law_1.2,1.0350591659545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,4,power_law_1.2,10.426777648925782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,2,power_law_1.2,1.0579775810241698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,2,power_law_1.2,1.103872013092041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,2,power_law_1.2,1.1794048309326173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,2,power_law_1.2,1.3271039962768554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,2,power_law_1.2,1.2916735649108886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,2,power_law_1.2,1.18538236618042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,2,power_law_1.2,1.3629440307617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,2,power_law_1.2,1.3461503982543945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,2,power_law_1.2,1.496678352355957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,2,power_law_1.2,1.6670719146728517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,2,power_law_1.2,1.7534975051879882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,4,power_law_1.2,15.069389343261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,2,power_law_1.2,1.924095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,2,power_law_1.2,2.3863296508789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,2,power_law_1.2,2.513100814819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,4,power_law_1.2,18.758438110351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,2,power_law_1.2,3.102310371398926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,2,power_law_1.2,3.738175964355469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,2,power_law_1.2,5.307187271118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,2,power_law_1.2,6.193971252441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,2,power_law_1.2,8.160460662841796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,2,power_law_1.2,9.423052978515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,2,power_law_1.2,13.974937438964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,64,power_law_1.01,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,64,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,64,power_law_1.01,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,64,power_law_1.01,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,64,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,64,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,64,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,64,power_law_1.01,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,64,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,64,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,64,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,64,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,64,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,64,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,64,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,64,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,64,power_law_1.01,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,64,power_law_1.01,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,64,power_law_1.01,0.15360000133514404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,64,power_law_1.01,0.24453120231628417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,64,power_law_1.01,0.3764031887054443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,64,power_law_1.01,0.5038080215454102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,1,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,1,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,1,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,1,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,1,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,1,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,1,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,1,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,1,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,1,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,1,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,1,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,1,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,1,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,1,balanced,0.09283733367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,1,balanced,0.11929600437482198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,1,balanced,0.16247466206550598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,1,balanced,0.20787199338277182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,1,balanced,0.23381332556406656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,1,balanced,0.2892799973487854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,1,balanced,0.36420265833536786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,1,balanced,0.5346986850102743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,1,balanced,0.7019519805908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,1,balanced,1.13373867670695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,1,balanced,1.5467519760131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,1,balanced,2.451456069946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,1,balanced,3.3648640314737954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,2,power_law_1.2,21.267047119140624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,4,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,4,balanced,0.041450666884581246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,4,balanced,0.23958933353424072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,4,balanced,0.45123199621836346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,4,balanced,0.8796106974283854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,4,balanced,0.8852480252583822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,4,balanced,0.8893226782480875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,4,balanced,0.884394645690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,4,balanced,0.8878080050150553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,4,balanced,0.8905226389567057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,4,balanced,0.8970239957173666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,4,balanced,0.9026559988657633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,4,balanced,0.9089706738789877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,4,balanced,0.91921067237854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,4,balanced,0.934229294459025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,4,balanced,0.9451519648234049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,4,balanced,0.9704106648763021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,4,balanced,1.0216106573740642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,4,balanced,1.0610346794128418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,4,balanced,1.1074559688568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,4,balanced,1.1745279630025227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,4,balanced,1.323520024617513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,4,balanced,1.504085381825765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,4,balanced,1.9247786204020183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,4,balanced,2.41100804011027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,4,balanced,3.5213279724121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,8,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,8,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,8,power_law_1.2,0.032953599095344545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,8,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,8,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,4,balanced,4.630869229634603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,8,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,8,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,8,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,8,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,8,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,8,power_law_1.2,0.08048639893531799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,8,power_law_1.2,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,8,power_law_1.2,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,8,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,8,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,8,balanced,0.04384533564249674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,8,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,8,power_law_1.2,0.1411072015762329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,8,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,8,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,8,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,8,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,8,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,8,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,8,balanced,0.060405333836873375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,8,power_law_1.2,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,8,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,8,balanced,0.06331733365853627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,8,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,8,balanced,0.07031466563542683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,8,balanced,0.07165333131949107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,8,balanced,0.08618666728337605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,8,balanced,0.15223466356595358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,8,balanced,0.21333332856496176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,8,balanced,0.29098665714263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,8,power_law_1.2,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,8,balanced,0.3375786542892456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,8,balanced,0.45653335253397626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,8,balanced,0.5956266721089681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,8,balanced,0.943610668182373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,8,balanced,1.3393920262654622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,8,balanced,2.0507307052612305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,8,balanced,2.809173266092936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,8,power_law_1.2,0.26972160339355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,8,power_law_1.2,0.37867519855499265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,8,power_law_1.2,0.5414912223815918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,8,power_law_1.2,0.7923711776733399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,8,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,8,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,8,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,8,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,8,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,8,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,8,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,8,power_law_1.2,0.061427199840545656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,8,power_law_1.2,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,8,power_law_1.2,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,8,power_law_1.2,0.11448320150375366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,8,power_law_1.2,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,8,power_law_1.2,0.12267520427703857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,8,power_law_1.2,0.15892479419708253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,8,power_law_1.2,0.17244160175323486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,8,power_law_1.2,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,8,power_law_1.2,0.37396481037139895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,8,power_law_1.2,0.475545597076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,8,power_law_1.2,0.735641622543335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,8,power_law_1.2,0.8853504180908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,8,power_law_1.2,1.0434559822082519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,8,power_law_1.2,1.3897664070129394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,8,power_law_1.2,1.885798454284668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,64,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,64,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,64,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,8,power_law_1.2,1.5441920280456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,64,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,64,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,64,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,64,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,64,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,64,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,64,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,64,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,64,power_law_1.01,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,64,power_law_1.01,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,64,power_law_1.01,0.12717440128326415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,64,power_law_1.01,0.2041856050491333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,64,power_law_1.01,0.3229696035385132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,64,power_law_1.01,0.44011521339416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,64,power_law_1.01,0.6842368125915528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,64,power_law_1.01,0.9177087783813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,8,power_law_1.2,1.884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,8,power_law_1.2,2.975948715209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,8,power_law_1.2,3.952025604248047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,8,power_law_1.2,5.9500480651855465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,8,power_law_1.2,3.3335296630859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,1,power_law_1.2,0.3319808006286621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,1,power_law_1.2,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,1,power_law_1.2,1.0317824363708497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,1,power_law_1.2,2.0197376251220702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,1,power_law_1.2,3.2931838989257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,1,power_law_1.2,4.668211364746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,1,power_law_1.2,5.311283111572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,1,power_law_1.2,7.632281494140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,1,power_law_1.2,7.909990692138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,1,power_law_1.2,8.430585479736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,1,power_law_1.2,8.676351928710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,1,power_law_1.2,8.981298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,1,power_law_1.2,9.274982452392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,1,power_law_1.2,9.698713684082032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,1,power_law_1.2,9.895116424560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,1,power_law_1.2,10.403225708007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,1,power_law_1.2,10.508493041992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,1,power_law_1.2,11.131699371337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,1,balanced,0.4358826478322347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,1,balanced,0.831658681233724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,1,balanced,1.4621013005574544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,1,balanced,2.861226717631022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,1,power_law_1.2,11.632006072998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,1,balanced,5.576874415079753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,1,balanced,8.201215744018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,1,power_law_1.2,12.582911682128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,8,power_law_1.2,7.2196098327636715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,8,power_law_1.2,4.327014541625976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,1,balanced,8.236714680989584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,1,balanced,8.26692263285319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,1,power_law_1.2,13.330636596679687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,1,balanced,8.299850463867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,1,balanced,8.34065055847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,1,balanced,8.390656153361002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,1,power_law_1.2,14.343577575683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,1,balanced,8.446634928385416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,1,balanced,8.502101262410482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,1,power_law_1.2,15.571136474609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,1,balanced,8.612351735432943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,1,balanced,8.710314432779947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,1,power_law_1.2,18.652774047851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,1,balanced,8.80793571472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,1,balanced,9.004373550415039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,1,balanced,9.688746770222982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,1,power_law_1.2,21.244313049316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,1,balanced,9.897130966186523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,1,balanced,10.519381205240885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,1,balanced,10.6693967183431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,1,power_law_1.2,27.578982543945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,1,balanced,12.03012212117513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,1,balanced,13.33026123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,4,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,4,balanced,0.0422986646493276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,4,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,4,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,4,balanced,0.07150933146476746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,4,balanced,0.20411733786265054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,4,balanced,0.20684800545374551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,4,balanced,0.20821332931518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,4,balanced,0.21093332767486572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,4,balanced,0.2121386726697286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,4,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,4,balanced,0.22218134005864462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,4,balanced,0.2249386707941691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,4,balanced,0.23432532946268717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,4,balanced,0.24472000201543173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,4,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,1,balanced,16.606549580891926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,4,balanced,0.26945600907007855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,4,balanced,0.30668799082438153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,1,power_law_1.2,32.35921936035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,4,balanced,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,4,balanced,0.38365332285563153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,4,balanced,0.4459520181020101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,4,balanced,0.6171306769053141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,4,balanced,0.7980373700459799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,4,balanced,1.2741973400115967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,4,balanced,1.765717347462972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,1,balanced,20.048725128173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,4,balanced,2.708650588989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,64,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,4,balanced,3.6309334437052407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,64,power_law_1.2,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,64,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,64,power_law_1.2,0.02250880002975464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,64,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,64,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,64,power_law_1.2,0.02743679881095886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,64,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,64,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,1,balanced,26.590037027994793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,64,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,64,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,64,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,64,power_law_1.2,0.04402559995651245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,64,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,64,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,64,power_law_1.2,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,64,power_law_1.2,0.15175679922103882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,64,power_law_1.2,0.159334397315979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,64,power_law_1.2,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,64,power_law_1.2,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,1,balanced,33.94542948404948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,64,power_law_1.2,0.5547776222229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,64,power_law_1.2,0.6041408061981202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,64,power_law_1.2,1.0217151641845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,64,power_law_1.2,1.4247615814208985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,1,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,1,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,1,power_law_1.2,0.0657151997089386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,1,power_law_1.2,0.12615679502487182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,1,power_law_1.2,0.24021759033203124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,1,power_law_1.2,0.341811203956604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,1,power_law_1.2,0.39813120365142823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,1,power_law_1.2,0.5369855880737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,1,power_law_1.2,0.5777408123016358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,1,power_law_1.2,0.5953536033630371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,1,power_law_1.2,0.6512639999389649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,1,power_law_1.2,0.6751935958862305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,1,power_law_1.2,0.7165952205657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,1,power_law_1.2,0.7632895946502686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,1,power_law_1.2,0.8079168319702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,1,power_law_1.2,0.8300543785095215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,1,power_law_1.2,0.9422847747802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,1,power_law_1.2,1.0962944030761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,1,power_law_1.2,1.264025592803955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,1,power_law_1.2,1.6220159530639648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,1,power_law_1.2,1.984716796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,1,power_law_1.2,2.6671104431152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,1,power_law_1.2,3.332915115356445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,1,power_law_1.2,4.754636764526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,1,power_law_1.2,6.215475082397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,1,power_law_1.2,9.259212493896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,1,power_law_1.2,12.310323333740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,8,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,8,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,8,balanced,0.2759573260943095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,8,balanced,0.5428906679153442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,8,balanced,1.03492267926534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,8,balanced,2.037930647532145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,8,balanced,3.027455965677897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,8,balanced,3.0122667948404946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,8,balanced,3.0184106826782227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,16,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,8,balanced,3.0167039235432944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,16,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,16,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,8,balanced,3.0271145502726235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,16,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,16,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,8,balanced,3.03496519724528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,16,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,16,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,8,balanced,3.0431572596232095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,16,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,16,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,8,balanced,3.0571521123250327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,16,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,16,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,8,balanced,3.074730555216471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,16,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,16,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,8,balanced,3.0813865661621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,16,power_law_1.2,0.058143997192382814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,16,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,16,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,8,balanced,3.1102078755696616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,16,power_law_1.2,0.07127040028572082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,16,power_law_1.2,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,8,balanced,3.170986811319987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,16,power_law_1.2,0.11857919692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,16,power_law_1.2,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,8,balanced,3.2843093872070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,16,power_law_1.2,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,16,power_law_1.2,0.4341760158538818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,8,balanced,3.3802239100138345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,16,power_law_1.2,0.6340608119964599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,8,balanced,3.4604320526123047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,16,power_law_1.2,0.8951807975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,8,balanced,3.6270081202189126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,16,power_law_1.2,1.3885439872741698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,8,balanced,4.174160003662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,16,power_law_1.2,2.533580780029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,8,balanced,4.222437222798665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,16,power_law_1.2,3.722035217285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,8,balanced,4.4282881418863935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,8,balanced,5.518677393595378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,8,balanced,6.174549102783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,8,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,8,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,8,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,8,power_law_1.2,0.20826239585876466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,8,power_law_1.2,0.2437119960784912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,8,power_law_1.2,0.17898240089416503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,8,power_law_1.2,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,8,power_law_1.2,0.2742271900177002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,8,power_law_1.2,0.2766848087310791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,8,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,8,power_law_1.2,0.2541568040847778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,8,power_law_1.2,0.2654207944869995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,8,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,8,power_law_1.2,0.30801920890808104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,8,power_law_1.2,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,8,power_law_1.2,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,8,power_law_1.2,0.3495935916900635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,8,power_law_1.2,0.3889152050018311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,8,power_law_1.2,0.41349120140075685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,8,power_law_1.2,0.48762879371643064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,8,power_law_1.2,0.5646336078643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,8,power_law_1.2,0.7464960098266602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,8,power_law_1.2,0.9854975700378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,8,power_law_1.2,1.4110719680786132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,8,power_law_1.2,2.0756479263305665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,8,power_law_1.2,3.161702346801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,8,power_law_1.2,4.04582405090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,2,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,2,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,2,power_law_1.2,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,2,power_law_1.2,0.15851520299911498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,2,power_law_1.2,0.19435520172119142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,2,power_law_1.2,0.3905535936355591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,2,power_law_1.2,0.41553921699523927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,2,power_law_1.2,0.4216832160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,2,power_law_1.2,0.4562943935394287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,2,power_law_1.2,0.4616191864013672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,2,power_law_1.2,0.4710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,2,power_law_1.2,0.4808703899383545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.4065279960632324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,2,power_law_1.2,0.4704256057739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.6070271968841553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,2,power_law_1.2,0.4788224220275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,1,power_law_1.2,1.0117119789123534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,1,power_law_1.2,1.0071935653686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,1,power_law_1.2,1.045299243927002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,1,power_law_1.2,1.0686464309692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,2,power_law_1.2,0.5105663776397705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,1,power_law_1.2,1.0713088035583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,2,power_law_1.2,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,1,power_law_1.2,1.0754048347473144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,2,power_law_1.2,0.5421055793762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,1,power_law_1.2,1.1003904342651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,2,power_law_1.2,0.6229951858520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,1,power_law_1.2,1.0858304023742675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,2,power_law_1.2,0.6428607940673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,1,power_law_1.2,1.1393024444580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,2,power_law_1.2,0.8167424201965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,1,power_law_1.2,1.1591679573059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,2,power_law_1.2,1.0442751884460448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,1,power_law_1.2,1.224499225616455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,1,power_law_1.2,1.286348819732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,1,power_law_1.2,1.344102382659912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,2,power_law_1.2,1.3789183616638183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,1,power_law_1.2,1.357414436340332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,1,power_law_1.2,1.5964159965515137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,1,power_law_1.2,1.7739776611328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,2,power_law_1.2,1.6416767120361329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,1,power_law_1.2,2.250137519836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,2,power_law_1.2,2.4580095291137694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,2,power_law_1.2,2.8033023834228517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,1,power_law_1.2,2.688409614562988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,1,power_law_1.2,3.6395008087158205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,1,power_law_1.01,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,1,power_law_1.01,0.3942399978637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,1,power_law_1.01,0.49991679191589355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,1,power_law_1.01,0.8787967681884765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,1,power_law_1.01,0.881868839263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,1,power_law_1.01,0.8886272430419921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,1,power_law_1.01,0.8951807975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,1,power_law_1.01,0.8998911857604981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,1,power_law_1.01,0.8832832336425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,1,power_law_1.01,0.9254912376403809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,1,power_law_1.01,0.9377792358398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,1,power_law_1.2,4.620902252197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,1,power_law_1.01,0.88985595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,1,power_law_1.01,0.9809920310974121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,1,power_law_1.01,1.0080256462097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,1,power_law_1.01,1.0743807792663573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,1,power_law_1.01,1.1200511932373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,1,power_law_1.01,1.203609561920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,2,power_law_1.2,4.174028778076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,1,power_law_1.01,1.3885439872741698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,1,power_law_1.01,1.5898624420166017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,1,power_law_1.01,1.9711999893188477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,1,power_law_1.01,2.40762882232666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,1,power_law_1.01,3.3384449005126955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,1,power_law_1.01,4.195123291015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,1,power_law_1.2,6.0368896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,32,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,32,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,32,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,32,balanced,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,32,balanced,0.2860373258590698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,32,balanced,0.5435733397801717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,32,balanced,0.791541337966919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,32,balanced,0.7942826747894287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,32,balanced,0.7944533030192057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,32,balanced,0.7965013186136881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,32,balanced,0.8000799814860026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,32,balanced,0.803669293721517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,32,balanced,0.8046933015187582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,32,balanced,0.8106666405995687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,32,balanced,0.8171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,32,balanced,0.8193706671396891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,32,balanced,0.8314879735310873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,32,balanced,0.8509439627329508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,32,balanced,0.8750080267588297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,32,balanced,0.9067520300547282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,32,balanced,0.9760426680246989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,32,balanced,1.0548906326293945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,32,balanced,1.0982133547465007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,32,balanced,1.2414240042368572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,32,balanced,1.4798506100972493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,32,balanced,1.9305814107259114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,32,balanced,2.4818239212036133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,1,power_law_1.01,5.976652908325195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,2,power_law_1.2,5.728460693359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,1,power_law_1.01,7.831142425537109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,1,power_law_1.01,11.242086029052734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,1,power_law_1.2,7.90118408203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,1,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,1,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,1,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,1,power_law_1.01,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,1,power_law_1.01,0.22526719570159912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,1,power_law_1.01,0.30208001136779783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,1,power_law_1.01,0.41697278022766116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,1,power_law_1.01,0.43683838844299316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,1,power_law_1.01,0.44646401405334474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,1,power_law_1.01,0.47656960487365724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,1,power_law_1.01,0.49111042022705076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,1,power_law_1.01,0.5195775985717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,1,power_law_1.01,0.5404672145843505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,1,power_law_1.01,0.582041597366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,1,power_law_1.01,0.6203392028808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,1,power_law_1.01,0.6477439880371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,1,power_law_1.01,0.734822416305542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,1,power_law_1.01,0.8790016174316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,1,power_law_1.01,1.0614784240722657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,1,power_law_1.01,1.399193572998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,1,power_law_1.01,1.7367040634155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,1,power_law_1.01,2.4059776306152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,1,power_law_1.01,3.058278465270996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,1,power_law_1.01,4.440473556518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,1,power_law_1.01,5.916876983642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,1,power_law_1.01,8.873779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,1,power_law_1.01,11.816140747070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,1,power_law_1.01,14.997299194335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,1,power_law_1.2,11.347148895263672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,1,power_law_1.2,14.554521179199218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,16,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,16,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,16,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,16,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,16,balanced,0.047413334250450134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,16,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,16,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,16,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,16,balanced,0.059546664357185364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,16,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,16,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,16,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,16,balanced,0.06348800162474315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,16,balanced,0.0747519979874293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,16,balanced,0.10939733187357585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,16,balanced,0.13004799683888754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,16,balanced,0.19473065932591757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,16,balanced,0.22169599930445352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,16,balanced,0.2474666635195414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,16,balanced,0.2935466567675273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,16,balanced,0.3413333495457967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,16,balanced,0.4222293297449748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,16,balanced,0.5195093154907227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,16,balanced,0.7570772965749105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,16,balanced,1.002837340037028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,16,balanced,1.5131306648254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,16,balanced,2.045952002207438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,2,power_law_1.01,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,2,power_law_1.01,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,2,power_law_1.01,0.27831039428710935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,2,power_law_1.01,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,2,power_law_1.01,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,2,power_law_1.01,0.4753407955169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,2,power_law_1.01,0.47861762046813966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,2,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,2,power_law_1.01,0.4966400146484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,2,power_law_1.01,0.5191679954528808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,2,power_law_1.01,0.5158912181854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,2,power_law_1.01,0.5259263992309571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,2,power_law_1.01,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,2,power_law_1.01,0.5873663902282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,2,power_law_1.01,0.5574656009674073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,2,power_law_1.01,0.6199295997619629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,2,power_law_1.01,0.6762495994567871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,2,power_law_1.01,0.8755200386047364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,2,power_law_1.01,0.840294361114502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,2,power_law_1.01,1.1610112190246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,2,power_law_1.01,1.7154048919677733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,2,power_law_1.01,2.0353023529052736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,2,power_law_1.01,0.33075199127197263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,2,power_law_1.01,2.675916862487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,2,power_law_1.01,0.5472256183624268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,2,power_law_1.01,0.8071167945861817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,2,power_law_1.01,1.3510656356811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,2,power_law_1.01,1.8423807144165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,2,power_law_1.01,2.332876777648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,2,power_law_1.01,2.9071359634399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,2,power_law_1.01,3.1492095947265626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,2,power_law_1.01,3.1901567459106444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,2,power_law_1.01,3.2176128387451173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,2,power_law_1.01,3.461119842529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,2,power_law_1.01,3.411763381958008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,2,power_law_1.01,3.501875305175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,2,power_law_1.01,3.7312511444091796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,2,power_law_1.01,3.701753616333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,2,power_law_1.01,3.8397953033447267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,2,power_law_1.01,3.9299072265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,2,power_law_1.01,4.029030227661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,2,power_law_1.01,4.176691055297852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,2,power_law_1.01,4.485318374633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,2,power_law_1.01,4.795187377929688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,2,power_law_1.01,5.257215881347657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,2,power_law_1.01,5.987942504882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,2,power_law_1.01,4.382720184326172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,2,power_law_1.01,7.549747467041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,2,power_law_1.01,8.996659088134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,2,power_law_1.01,12.831333923339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,2,power_law_1.01,14.507008361816407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,128,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,128,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,128,power_law_1.01,0.02805120050907135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,128,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,128,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,128,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,128,power_law_1.01,0.029875200986862183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,128,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,128,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,128,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,128,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,128,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,128,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,128,power_law_1.01,0.032742398977279666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,128,power_law_1.01,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,128,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,128,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,128,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,128,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,128,power_law_1.01,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,128,power_law_1.01,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,128,power_law_1.01,0.1282047986984253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,128,power_law_1.01,0.17571840286254883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,128,power_law_1.01,0.33648641109466554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,128,power_law_1.01,0.4777984142303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,128,power_law_1.01,0.6899328231811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,128,power_law_1.01,0.9569919586181641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,2,power_law_1.01,4.823027038574219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,2,power_law_1.01,7.811686706542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,2,power_law_1.01,8.876236724853516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,4,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,4,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,4,power_law_1.2,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,4,power_law_1.2,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,4,power_law_1.2,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,4,power_law_1.2,0.3358720064163208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,4,power_law_1.2,0.33505280017852784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,4,power_law_1.2,0.32071681022644044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,4,power_law_1.2,0.35246078968048095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,4,power_law_1.2,0.3680255889892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,4,power_law_1.2,0.36964480876922606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,4,power_law_1.2,0.3926016092300415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,4,power_law_1.2,0.38727679252624514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,32,power_law_1.2,0.04053759872913361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,4,power_law_1.2,0.394649600982666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,32,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,4,power_law_1.2,0.42700800895690916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,32,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,4,power_law_1.2,0.42104320526123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,32,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,4,power_law_1.2,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,32,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,4,power_law_1.2,0.5093376159667968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,32,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,4,power_law_1.2,0.5441535949707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,32,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,4,power_law_1.2,0.6805503845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,32,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,32,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,4,power_law_1.2,0.829644775390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,32,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,32,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,4,power_law_1.2,1.1579392433166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,32,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,32,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,4,power_law_1.2,1.3141823768615724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,32,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,32,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,32,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,32,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,32,power_law_1.2,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,4,power_law_1.2,1.9396608352661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,32,power_law_1.2,0.0997376024723053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,32,power_law_1.2,0.12738560438156127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,32,power_law_1.2,0.17653759717941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,4,power_law_1.2,2.4569664001464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,32,power_law_1.2,0.27913599014282225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,32,power_law_1.2,0.293887996673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,32,power_law_1.2,0.4321280002593994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,32,power_law_1.2,0.6541312217712403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,32,power_law_1.2,1.0156031608581544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,32,power_law_1.2,1.519820785522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,4,power_law_1.2,3.6380672454833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,4,power_law_1.2,4.9438526153564455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,32,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,32,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,32,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,32,power_law_1.2,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,32,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,32,power_law_1.2,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,32,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,32,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,32,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,32,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,32,power_law_1.2,0.060198402404785155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,32,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,32,power_law_1.2,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,32,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,32,power_law_1.2,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,32,power_law_1.2,0.10649600028991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,32,power_law_1.2,0.16117759943008422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,32,power_law_1.2,0.21032319068908692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,32,power_law_1.2,0.2559999942779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,32,power_law_1.2,0.3037184000015259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,32,power_law_1.2,0.35082240104675294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,32,power_law_1.2,0.4909056186676025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,32,power_law_1.2,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,32,power_law_1.2,0.9549823760986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,32,power_law_1.2,1.2120063781738282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,32,power_law_1.2,2.1710847854614257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,64,balanced,0.02065066620707512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,64,balanced,0.02164799968401591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,64,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,64,balanced,0.020309332758188248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,64,balanced,0.02065066620707512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,64,balanced,0.021674667795499165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,64,balanced,0.021674667795499165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,64,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,32,power_law_1.2,2.6357759475708007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,64,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,64,balanced,0.02235200007756551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,64,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,64,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,64,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,64,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,64,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,64,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,64,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,64,balanced,0.03071466585000356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,64,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,64,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,64,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,64,balanced,0.04675200084845225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,64,balanced,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,64,balanced,0.07133866846561432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,64,balanced,0.1358506679534912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,64,balanced,0.20616533358891806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,4,power_law_1.2,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,4,power_law_1.2,0.5259263992309571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,4,power_law_1.2,0.7063551902770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,4,power_law_1.2,1.0584063529968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,4,power_law_1.2,1.080934429168701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,4,power_law_1.2,1.5155200004577636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,4,power_law_1.2,1.6095232009887694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,4,power_law_1.2,1.5923199653625488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,4,power_law_1.2,1.6967679977416992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,4,power_law_1.2,1.6861183166503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,4,power_law_1.2,1.7332223892211913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,4,power_law_1.2,1.680588722229004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,4,power_law_1.2,1.8137088775634767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,4,power_law_1.2,1.8526208877563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,4,power_law_1.2,1.864499282836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,4,power_law_1.2,1.841971206665039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,4,power_law_1.2,1.9093503952026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,4,power_law_1.2,2.0322303771972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,4,power_law_1.2,2.2001663208007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,4,power_law_1.2,2.6861568450927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,4,power_law_1.2,3.1080448150634767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,4,power_law_1.2,4.1412609100341795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,4,power_law_1.2,3.735756683349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.07454720139503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.5428864002227783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,1,power_law_1.2,1.0356736183166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,1,power_law_1.2,1.6519168853759765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,1,power_law_1.2,2.371993637084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,1,power_law_1.2,2.802892875671387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,1,power_law_1.2,3.9215103149414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,1,power_law_1.2,4.116479873657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,4,power_law_1.2,6.2130176544189455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,1,power_law_1.2,4.214988708496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,1,power_law_1.2,4.511129760742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,1,power_law_1.2,4.677836990356445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,1,power_law_1.2,4.868505477905273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,1,power_law_1.2,5.017804718017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,1,power_law_1.2,5.251891326904297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,1,power_law_1.2,5.414502334594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,1,power_law_1.2,5.637113571166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,1,power_law_1.2,5.9109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,1,power_law_1.2,6.4307197570800785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,4,power_law_1.2,6.73095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,1,power_law_1.2,6.992281341552735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,1,power_law_1.2,7.7662208557128904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,1,power_law_1.2,8.840383911132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,1,power_law_1.2,9.73883514404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,1,power_law_1.2,12.166758728027343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,1,power_law_1.2,14.009344482421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,1,power_law_1.2,18.870681762695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,8,power_law_1.01,0.3811327934265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,8,power_law_1.01,0.6897664070129395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,8,power_law_1.01,0.7944191932678223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,8,power_law_1.01,0.9541631698608398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,1,power_law_1.2,22.243501281738283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,8,power_law_1.01,0.9789440155029296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,8,power_law_1.01,0.941260814666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,8,power_law_1.01,1.1397120475769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,8,power_law_1.01,1.1491328239440919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,8,power_law_1.01,1.1522047996520997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,8,power_law_1.01,1.0518336296081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,8,power_law_1.01,1.1935744285583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,8,power_law_1.01,1.1034560203552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,8,power_law_1.01,1.123737621307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,8,power_law_1.01,1.2580863952636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,8,power_law_1.01,1.201356792449951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,8,power_law_1.01,1.291263961791992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,8,power_law_1.01,1.2587008476257324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,8,power_law_1.01,1.306009578704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,8,power_law_1.01,1.400217628479004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,8,power_law_1.01,1.3813759803771972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,8,power_law_1.01,1.5779840469360351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,8,power_law_1.01,1.924095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,8,power_law_1.01,2.1168127059936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,8,power_law_1.01,2.76889591217041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,8,power_law_1.01,3.0619647979736326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,4,power_law_1.2,10.273177337646484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,8,power_law_1.01,4.389068984985352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,8,power_law_1.01,5.473484802246094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,4,power_law_1.2,12.218777465820313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,16,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,16,power_law_1.2,0.15275520086288452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,16,power_law_1.2,0.07491840124130249
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,16,power_law_1.2,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,16,power_law_1.2,0.14561280012130737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,16,power_law_1.2,0.10055680274963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,16,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,16,power_law_1.2,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,16,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,16,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,16,power_law_1.2,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,16,power_law_1.2,0.10977280139923096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,16,power_law_1.2,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,16,power_law_1.2,0.15275520086288452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,16,power_law_1.2,0.15380480289459228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,16,power_law_1.2,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,16,power_law_1.2,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,16,power_law_1.2,0.19904639720916747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,16,power_law_1.2,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,16,power_law_1.2,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,16,power_law_1.2,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,16,power_law_1.2,0.3487744092941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,16,power_law_1.2,0.4108287811279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,16,power_law_1.2,0.6262784004211426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,16,power_law_1.2,0.8501248359680176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,16,power_law_1.2,1.4546943664550782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,16,power_law_1.2,2.026495933532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,8,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,8,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,8,balanced,0.2435413400332133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,8,balanced,0.4872533480326335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,8,balanced,0.8430933157602946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,8,balanced,1.0810026327768962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,8,balanced,1.0871466795603435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,8,balanced,1.0767359733581543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,8,balanced,1.0803199609120686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,8,balanced,1.0828746954600017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,8,balanced,1.089194695154826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,8,balanced,1.097215970357259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,8,balanced,1.1037013530731201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,8,balanced,1.116159995396932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,8,balanced,1.1313493251800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,8,balanced,1.1467093626658122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,8,balanced,1.1651413440704346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,8,balanced,1.1837440331776936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,8,balanced,1.2284586429595947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,8,balanced,1.3255679607391357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,8,balanced,1.4216532707214355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,8,balanced,1.6356693903605144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,8,balanced,1.8433705965677898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,8,balanced,2.32806396484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,8,balanced,2.895359992980957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,8,balanced,3.9761921564737954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,8,balanced,5.060437202453613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,32,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,32,balanced,0.02712533374627431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,32,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,32,balanced,0.027802666028340656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,32,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,32,balanced,0.030192000170548756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,32,balanced,0.03018666555484136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,32,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,32,balanced,0.030373332401116688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,32,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,32,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,32,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,32,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,32,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,32,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,32,balanced,0.03597866743803024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,32,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,32,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,32,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,32,balanced,0.07130666573842366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,32,balanced,0.18363734086354574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,32,balanced,0.2392586668332418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,32,balanced,0.34696535269419354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,32,balanced,0.4476319948832194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,32,balanced,0.701754649480184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,32,balanced,0.9328640302022299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,8,power_law_1.01,0.39933440685272215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,8,power_law_1.01,0.753868818283081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,8,power_law_1.01,0.6264832019805908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,8,power_law_1.01,0.7857855796813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,8,power_law_1.01,0.9048064231872559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,8,power_law_1.01,0.9189375877380371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,8,power_law_1.01,0.8771583557128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,8,power_law_1.01,0.8978431701660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,8,power_law_1.01,0.9733823776245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,8,power_law_1.01,0.9170944213867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,8,power_law_1.01,0.9920512199401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,8,power_law_1.01,0.9750528335571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,8,power_law_1.01,1.0256383895874024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,8,power_law_1.01,1.0080256462097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,8,power_law_1.01,1.0502143859863282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,8,power_law_1.01,1.0536959648132325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,8,power_law_1.01,1.0889216423034669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,8,power_law_1.01,1.1505663871765137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,8,power_law_1.01,1.2607295989990235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,8,power_law_1.01,1.4061375617980958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,8,power_law_1.01,1.5452159881591796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,8,power_law_1.01,1.8966527938842774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,8,power_law_1.01,2.1860095977783205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,8,power_law_1.01,2.919424057006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,8,power_law_1.01,3.419750213623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,8,power_law_1.01,5.170790481567383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,8,power_law_1.01,6.562406158447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,16,power_law_1.01,0.05219200253486633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,32,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,32,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,32,balanced,0.03549333413441976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,32,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,32,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,32,balanced,0.18978132804234824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,32,balanced,0.19080533583958945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,32,balanced,0.19165867567062378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,32,balanced,0.19234132766723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,32,balanced,0.19234132766723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,32,balanced,0.19336533546447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,32,balanced,0.19473065932591757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,32,balanced,0.1967680056889852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,32,balanced,0.1991680065790812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,32,balanced,0.20239466428756714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,32,balanced,0.20376000801722208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,16,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,32,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,32,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,16,power_law_1.01,0.04647679924964905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,32,balanced,0.22663466135660806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,32,balanced,0.23773866891860962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,16,power_law_1.01,0.04647679924964905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,32,balanced,0.2525866627693176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,16,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,32,balanced,0.28757333755493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,32,balanced,0.30822400252024335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,16,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,32,balanced,0.38707200686136883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,16,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,16,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,32,balanced,0.4106239875157674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,16,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,32,balanced,0.5937493244806925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,16,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,16,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,32,balanced,0.7541759808858236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,16,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,16,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,16,power_law_1.01,0.05813760161399841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,16,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,16,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,16,power_law_1.01,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,16,power_law_1.01,0.1060863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,16,power_law_1.01,0.13904000520706178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,16,power_law_1.01,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,16,power_law_1.01,0.2902015924453735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,16,power_law_1.01,0.4038656234741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,16,power_law_1.01,0.5627903938293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,16,power_law_1.01,0.8693759918212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,16,power_law_1.01,1.1476991653442383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,16,power_law_1.01,1.9580928802490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,16,power_law_1.01,2.641695976257324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,128,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,128,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,128,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,128,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,128,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,128,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,128,balanced,0.04760533571243286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,128,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,128,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,128,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,128,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,128,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,128,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,128,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,128,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,128,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,128,balanced,0.06229333579540253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,128,balanced,0.0766293356815974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,128,balanced,0.08362666765848796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,128,balanced,0.11724799871444702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,128,balanced,0.13260799646377563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,128,balanced,0.2686293323834737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,128,balanced,0.3078826665878296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,128,balanced,0.4128426710764567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,128,balanced,0.5106346607208252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,128,balanced,0.7686826388041178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,128,balanced,1.0117119948069255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,4,power_law_1.01,0.33402879238128663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,4,power_law_1.01,0.5134335994720459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,4,power_law_1.01,0.6057983875274658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,4,power_law_1.01,0.7612415790557862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,4,power_law_1.01,0.908902359008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,4,power_law_1.01,1.1812864303588868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,4,power_law_1.01,1.2007424354553222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,4,power_law_1.01,1.1579392433166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,4,power_law_1.01,1.2511232376098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,4,power_law_1.01,1.221836757659912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,4,power_law_1.01,1.309286403656006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,4,power_law_1.01,1.2705727577209474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,4,power_law_1.01,1.3608960151672362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,4,power_law_1.01,1.4090239524841308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,4,power_law_1.01,1.3668352127075196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,4,power_law_1.01,1.447116756439209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,4,power_law_1.01,1.4602239608764649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,4,power_law_1.01,1.5007743835449219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,4,power_law_1.01,1.6326656341552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,4,power_law_1.01,1.7870847702026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,4,power_law_1.01,1.9732479095458983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,4,power_law_1.01,2.4756095886230467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,4,power_law_1.01,2.8409856796264648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,4,power_law_1.01,4.092313766479492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,4,power_law_1.01,4.756480026245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,4,power_law_1.01,6.667059326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,32,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,32,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,32,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,32,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,32,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,32,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,32,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,32,power_law_1.2,0.0536191999912262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,32,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,32,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,32,power_law_1.2,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,4,power_law_1.01,8.180326080322265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,32,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,32,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,32,power_law_1.2,0.07188479900360108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,32,power_law_1.2,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,32,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,32,power_law_1.2,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,32,power_law_1.2,0.1265663981437683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,32,power_law_1.2,0.15400960445404052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,32,power_law_1.2,0.23367679119110107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,32,power_law_1.2,0.2760576009750366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,32,power_law_1.2,0.46284799575805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,32,power_law_1.2,0.6756351947784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,32,power_law_1.2,0.9187328338623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,32,power_law_1.2,1.3783040046691895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,1,power_law_1.01,1.4493696212768554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,1,power_law_1.01,2.830745506286621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,1,power_law_1.01,5.722521591186523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,1,power_law_1.01,10.133299255371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,32,power_law_1.2,2.37445125579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,1,power_law_1.01,14.02081298828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,32,power_law_1.2,2.855526351928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,1,power_law_1.01,23.644569396972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,1,power_law_1.01,25.586483764648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,1,power_law_1.01,27.230209350585938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,1,power_law_1.01,27.333004760742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,1,power_law_1.01,27.69776611328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,4,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,4,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,4,power_law_1.01,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,4,power_law_1.01,0.12431360483169555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,4,power_law_1.01,0.20049920082092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,8,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,8,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,4,power_law_1.01,0.26746881008148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,8,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,4,power_law_1.01,0.2883584022521973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,8,power_law_1.2,0.05240319967269898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,4,power_law_1.01,0.34406399726867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,8,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,4,power_law_1.01,0.35450880527496337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,4,power_law_1.01,0.32133119106292723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,4,power_law_1.01,0.35143680572509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,4,power_law_1.01,0.3530751943588257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,8,power_law_1.2,0.05813120007514953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,1,power_law_1.01,28.061285400390624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,4,power_law_1.01,0.3817471981048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,8,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,4,power_law_1.01,0.4122623920440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,8,power_law_1.2,0.058771198987960814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,4,power_law_1.01,0.3989504098892212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,8,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,4,power_law_1.01,0.40898561477661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,8,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,4,power_law_1.01,0.44359679222106935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,8,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,8,power_law_1.2,0.06653439998626709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,4,power_law_1.01,0.49786877632141113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,8,power_law_1.2,0.06959999799728393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,4,power_law_1.01,0.548857593536377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,8,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,8,power_law_1.2,0.1031999945640564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,4,power_law_1.01,0.6512639999389649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,8,power_law_1.2,0.12840960025787354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,4,power_law_1.01,0.7639039993286133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,8,power_law_1.2,0.16424959897994995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,8,power_law_1.2,0.23879680633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,4,power_law_1.01,0.9998335838317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,8,power_law_1.2,0.2693120002746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,8,power_law_1.2,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,4,power_law_1.01,1.3545472145080566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,8,power_law_1.2,0.41656317710876467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,8,power_law_1.2,0.6262784004211426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,4,power_law_1.01,1.8845695495605468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,8,power_law_1.2,0.8384511947631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,4,power_law_1.01,2.5364479064941405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,8,power_law_1.2,1.224294376373291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,1,power_law_1.01,29.138330078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,8,power_law_1.2,1.8655231475830079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,4,power_law_1.01,3.5606529235839846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,8,power_law_1.2,2.817433547973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,4,power_law_1.01,4.901478576660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,8,power_law_1.2,4.096819305419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,1,power_law_1.01,30.35914306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,1,power_law_1.01,30.801919555664064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,1,power_law_1.01,31.554763793945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,1,power_law_1.01,32.47841186523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,1,power_law_1.01,34.56839599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,8,power_law_1.01,0.0296640008687973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,8,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,8,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,8,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,8,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,8,power_law_1.01,0.030905601382255555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,8,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,8,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,8,power_law_1.01,0.033344000577926636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,8,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,8,power_law_1.01,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,8,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,8,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,8,power_law_1.01,0.04832000136375427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,8,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,8,power_law_1.01,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,1,power_law_1.01,37.044427490234376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,8,power_law_1.01,0.09687039852142335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,8,power_law_1.01,0.14476799964904785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,8,power_law_1.01,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,1,power_law_1.01,37.21830444335937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,8,power_law_1.01,0.372326397895813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,1,power_law_1.01,40.19158935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,8,power_law_1.01,0.4640768051147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,8,power_law_1.01,0.7208576202392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,1,power_law_1.01,38.570394897460936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,1,power_law_1.01,44.00005187988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,1,power_law_1.01,45.447576904296874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,8,power_law_1.01,1.1196288108825683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,1,power_law_1.01,55.303375244140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,16,power_law_1.01,0.16588799953460692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,16,power_law_1.01,0.3559423923492432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,16,power_law_1.01,0.3583872079849243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,16,power_law_1.01,0.3579904079437256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,16,power_law_1.01,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,16,power_law_1.01,0.3131392002105713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,16,power_law_1.01,0.3344383955001831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,16,power_law_1.01,0.31887359619140626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,16,power_law_1.01,0.31969280242919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,16,power_law_1.01,0.3117055892944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,16,power_law_1.01,0.30064640045166013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,16,power_law_1.01,0.3303231954574585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,16,power_law_1.01,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,16,power_law_1.01,0.3315711975097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,16,power_law_1.01,0.3604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,16,power_law_1.01,0.3436543941497803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,16,power_law_1.01,0.3407871961593628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,16,power_law_1.01,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,16,power_law_1.01,0.40816640853881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,16,power_law_1.01,0.41840639114379885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,16,power_law_1.01,0.475545597076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,16,power_law_1.01,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,16,power_law_1.01,0.7116799831390381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,16,power_law_1.01,0.9158656120300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,16,power_law_1.01,1.183743953704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,1,power_law_1.01,65.9894287109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,16,power_law_1.01,1.6103424072265624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,16,power_law_1.01,2.0025344848632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,8,power_law_1.01,1.6565887451171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,8,power_law_1.01,2.21081600189209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,1,power_law_1.01,86.37704467773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,1,power_law_1.2,0.5904384136199952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,1,power_law_1.2,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,1,power_law_1.2,2.010111999511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,1,power_law_1.01,96.813671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,1,power_law_1.2,3.9739009857177736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,1,power_law_1.2,6.31541748046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,1,power_law_1.2,8.847360229492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,1,power_law_1.2,11.020492553710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,1,power_law_1.2,15.155404663085937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,1,power_law_1.2,16.15851593017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,1,power_law_1.2,16.603123474121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,1,power_law_1.2,17.193370056152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,1,power_law_1.2,18.080152893066405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,1,power_law_1.2,18.266522216796876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,1,power_law_1.2,18.99622344970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,1,power_law_1.2,18.862693786621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,1,power_law_1.2,19.683941650390626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,8,power_law_1.01,0.8271743774414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,8,power_law_1.01,1.467801570892334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,8,power_law_1.01,1.176371192932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,8,power_law_1.01,1.5566847801208497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,8,power_law_1.01,1.82476806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,8,power_law_1.01,1.8968576431274413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,1,power_law_1.2,20.633804321289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,8,power_law_1.01,1.6642047882080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,8,power_law_1.01,1.8569215774536132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,8,power_law_1.01,1.864089584350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,8,power_law_1.01,1.7713151931762696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,8,power_law_1.01,1.8397184371948243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,8,power_law_1.01,1.9341312408447267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,8,power_law_1.01,1.9357440948486329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,8,power_law_1.01,2.0278976440429686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,1,power_law_1.2,21.604966735839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,8,power_law_1.01,2.0780799865722654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,8,power_law_1.01,2.0938751220703127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,8,power_law_1.01,2.1331968307495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,8,power_law_1.01,2.1571584701538087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,8,power_law_1.01,2.247475242614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,8,power_law_1.01,2.5548799514770506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,1,power_law_1.2,22.80980529785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,8,power_law_1.01,2.8448768615722657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,8,power_law_1.01,3.544473648071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,8,power_law_1.01,3.471974563598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,8,power_law_1.01,4.691558456420898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,1,power_law_1.2,24.097152709960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,8,power_law_1.01,5.417350387573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,8,power_law_1.01,7.831552124023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,1,power_law_1.2,25.745819091796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,8,power_law_1.01,9.629901123046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,1,power_law_1.2,28.082382202148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,1,power_law_1.2,30.014431762695313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,1,power_law_1.2,35.140814208984374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,1,power_law_1.2,40.182168579101564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,4,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,4,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,4,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,4,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,4,balanced,0.038389332592487335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,4,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,4,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,4,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,4,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,4,balanced,0.04078399886687597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,4,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,4,balanced,0.053413331508636475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,4,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,4,balanced,0.06673066814740498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,4,balanced,0.08550399541854858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,4,balanced,0.08772266904513042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,4,balanced,0.11588266491889954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,4,balanced,0.16895999511082968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,4,balanced,0.21076265970865884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,4,balanced,0.2583893338839213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,4,balanced,0.3218773404757182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,4,balanced,0.4729173183441162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,4,balanced,0.6299306551615397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,4,balanced,0.9335467020670573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,4,balanced,1.285802682240804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,4,balanced,2.0171093940734863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,4,balanced,2.747904141743978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,1,power_law_1.2,50.98147888183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,64,power_law_1.2,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,64,power_law_1.2,0.020262399315834047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,64,power_law_1.2,0.019251200556755065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,64,power_law_1.2,0.01945600062608719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,64,power_law_1.2,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,64,power_law_1.2,0.020684799551963805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,64,power_law_1.2,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,64,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,64,power_law_1.2,0.024979199469089507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,64,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,64,power_law_1.2,0.02619520127773285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,64,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,64,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,64,power_law_1.2,0.03930880129337311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,64,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,64,power_law_1.2,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,64,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,64,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,64,power_law_1.2,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,64,power_law_1.2,0.08273919820785522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,1,power_law_1.2,65.4403564453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,64,power_law_1.2,0.12902400493621827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,64,power_law_1.2,0.16752640008926392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,64,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,64,power_law_1.2,0.5279744148254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,8,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,8,balanced,0.05102399984995524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,8,balanced,0.06195199986298879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,8,balanced,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,8,balanced,0.28380799293518066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,8,balanced,0.2846720019976298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,8,balanced,0.285866657892863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,8,balanced,0.28757333755493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,8,balanced,0.29047467311223346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,8,balanced,0.2925173242886861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,8,balanced,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,8,balanced,0.3017386595408122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,8,balanced,0.30856533845265705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,8,balanced,0.3126613299051921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,8,balanced,0.3256319959958394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,8,balanced,0.35140268007914227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,8,balanced,0.37444265683492023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,8,balanced,0.42188799381256104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,8,balanced,0.4753066698710124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,8,balanced,0.6126933495203654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,8,balanced,0.8198826313018799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,8,balanced,1.1856213410695393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,8,balanced,1.5614293416341145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,8,balanced,2.232661406199137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,8,balanced,2.847402572631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,64,power_law_1.2,0.6795263767242432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,2,power_law_1.01,0.4268032073974609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,2,power_law_1.01,0.6541312217712403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,2,power_law_1.01,0.683622407913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,2,power_law_1.01,0.9869312286376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,2,power_law_1.01,1.0338303565979003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,2,power_law_1.01,1.041817569732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,2,power_law_1.01,1.0514431953430177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,2,power_law_1.01,1.0674176216125488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,2,power_law_1.01,1.1081727981567382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,2,power_law_1.01,1.1626496315002441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,2,power_law_1.01,1.1999232292175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,2,power_law_1.01,1.2703743934631349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,2,power_law_1.01,1.407590389251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,2,power_law_1.01,1.4028800010681153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,2,power_law_1.01,1.5576959609985352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,2,power_law_1.01,1.477017593383789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,2,power_law_1.01,1.781760025024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,2,power_law_1.01,2.1444608688354494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,16,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,16,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,16,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,16,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,16,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,2,power_law_1.01,2.528460884094238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,16,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,16,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,16,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,16,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,16,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,16,power_law_1.2,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,16,power_law_1.2,0.05795199871063232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,16,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,16,power_law_1.2,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,16,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,16,power_law_1.2,0.16752640008926392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,16,power_law_1.2,0.18862080574035645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,16,power_law_1.2,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,16,power_law_1.2,0.33812479972839354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,2,power_law_1.01,3.380633544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,16,power_law_1.2,0.6537216186523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,16,power_law_1.2,0.7878655910491943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,16,power_law_1.2,1.2283904075622558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,16,power_law_1.2,1.4606335639953614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,2,power_law_1.01,3.608371353149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,16,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,16,balanced,0.06517333288987477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,16,balanced,0.293887992699941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,16,balanced,0.5454506476720175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,16,balanced,1.0581333637237549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,16,balanced,2.0363945960998535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,16,balanced,2.042880058288574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,2,power_law_1.01,5.637529754638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,16,balanced,2.0461227099100747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,16,balanced,2.0444159507751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,16,balanced,2.0449280738830566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,16,balanced,2.0520960489908853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,16,balanced,2.056527932484945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,16,balanced,2.058922608693441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,16,balanced,2.067626635233561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,16,balanced,2.0765013694763184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,16,balanced,2.0862293243408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,16,balanced,2.1128533681233725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,16,balanced,2.188965320587158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,16,balanced,2.2237866719563804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,16,balanced,2.2604799270629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,16,balanced,2.318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,16,balanced,2.7202558517456055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,16,balanced,2.8055893580118814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,16,balanced,3.2808958689371743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,16,balanced,3.469482739766439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,16,balanced,4.250794728597005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,16,balanced,5.209941228230794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,16,power_law_1.2,0.21667840480804443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,16,power_law_1.2,0.2994175910949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,16,power_law_1.2,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,16,power_law_1.2,0.3000319957733154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,16,power_law_1.2,0.30023679733276365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,16,power_law_1.2,0.2623487949371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,16,power_law_1.2,0.28095359802246095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,16,power_law_1.2,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,16,power_law_1.2,0.2648063898086548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,16,power_law_1.2,0.28487679958343504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,2,power_law_1.01,6.4814910888671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,16,power_law_1.2,0.28813440799713136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,16,power_law_1.2,0.2942975997924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,16,power_law_1.2,0.3043328046798706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,16,power_law_1.2,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,16,power_law_1.2,0.3295232057571411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,16,power_law_1.2,0.3248127937316895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,16,power_law_1.2,0.35348479747772216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,16,power_law_1.2,0.39301118850708006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,16,power_law_1.2,0.40222721099853515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,16,power_law_1.2,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,16,power_law_1.2,0.5648384094238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,16,power_law_1.2,0.7227392196655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,16,power_law_1.2,0.9033727645874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,16,power_law_1.2,1.4196736335754394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,16,power_law_1.2,1.867366409301758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,16,power_law_1.2,2.9847551345825196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,16,power_law_1.2,3.705830383300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,2,power_law_1.01,9.616998291015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,16,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,16,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,16,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,16,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,16,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,16,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,16,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,16,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,16,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,16,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,16,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,16,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,16,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,16,power_law_1.01,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,16,power_law_1.01,0.08888319730758668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,16,power_law_1.01,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,16,power_law_1.01,0.15278079509735107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,16,power_law_1.01,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,16,power_law_1.01,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,16,power_law_1.01,0.3919872045516968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,16,power_law_1.01,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,16,power_law_1.01,0.6617087841033935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,16,power_law_1.01,1.0127360343933105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,16,power_law_1.01,1.4219264030456542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,2,power_law_1.01,11.423129272460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,2,power_law_1.01,14.672486877441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,32,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,32,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,32,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,32,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,32,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,32,power_law_1.01,0.03540480136871338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,32,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,32,power_law_1.01,0.03581439852714539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,32,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,32,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,32,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,32,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,32,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,32,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,32,power_law_1.01,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,32,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,32,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,32,power_law_1.01,0.11486719846725464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,32,power_law_1.01,0.17592320442199708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,32,power_law_1.01,0.22814719676971434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,32,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,32,power_law_1.01,0.40755200386047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,32,power_law_1.01,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,32,power_law_1.01,0.8941184043884277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,32,power_law_1.01,1.1900927543640136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,32,power_law_1.01,1.6910335540771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,32,power_law_1.01,2.4952831268310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,2,power_law_1.01,24.253439331054686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,2,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,2,balanced,0.1525759994983673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,2,balanced,0.3536213239034017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,2,balanced,0.6719146569569906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,2,balanced,1.3026986916859944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,2,balanced,2.60915199915568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,2,balanced,2.616490681966146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,2,balanced,2.625194708506266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,2,balanced,2.63372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,2,balanced,2.6419199307759604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,2,balanced,2.6064213116963706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,2,balanced,2.6210986773173013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,2,balanced,2.6338987350463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,2,balanced,2.6555733680725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,2,balanced,2.674858729044596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,2,balanced,2.693632125854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,2,balanced,2.729130744934082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,2,balanced,2.797738711039225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,2,balanced,2.8695894877115884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,2,balanced,3.023359934488932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,2,balanced,3.143850644429525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,2,balanced,3.4333012898763022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,2,balanced,3.7060267130533853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,2,balanced,4.024832089742024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,2,balanced,4.548949241638184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,2,balanced,5.7695573170979815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,2,balanced,7.2695465087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,4,power_law_1.01,0.1425279974937439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,4,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,4,power_law_1.01,0.16465920209884644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,4,power_law_1.01,0.24697599411010743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,4,power_law_1.01,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,4,power_law_1.01,0.2510848045349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,4,power_law_1.01,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,4,power_law_1.01,0.2506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,4,power_law_1.01,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,4,power_law_1.01,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,4,power_law_1.01,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,4,power_law_1.01,0.2678719997406006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,4,power_law_1.01,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,4,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,4,power_law_1.01,0.3295039892196655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,4,power_law_1.01,0.40755200386047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,4,power_law_1.01,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,4,power_law_1.01,0.5230527877807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,4,power_law_1.01,0.6004735946655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,4,power_law_1.01,0.8658944129943847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,4,power_law_1.01,1.0178560256958007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,4,power_law_1.01,1.82108154296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,4,power_law_1.01,2.6812416076660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,4,power_law_1.2,0.6074368000030518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,4,power_law_1.2,1.0463232040405273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,4,power_law_1.2,1.518182373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,4,power_law_1.2,2.086297607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,4,power_law_1.2,3.0054399490356447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,4,power_law_1.2,3.766252899169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,4,power_law_1.2,3.7564414978027343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,4,power_law_1.01,3.63006706237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,4,power_law_1.2,4.734156799316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,4,power_law_1.2,4.35077133178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,4,power_law_1.2,4.45214729309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,4,power_law_1.2,4.48614387512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,4,power_law_1.2,5.1554302215576175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,4,power_law_1.2,4.770611190795899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,4,power_law_1.2,4.986470413208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,4,power_law_1.2,5.35736312866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,4,power_law_1.2,4.854579162597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,4,power_law_1.2,5.487206268310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,4,power_law_1.2,6.101811218261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,4,power_law_1.2,5.741772842407227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,4,power_law_1.2,6.435020446777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,4,power_law_1.2,6.873907470703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,4,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,4,power_law_1.2,0.029075199365615846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,4,power_law_1.2,0.0296640008687973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,4,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,4,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,4,power_law_1.2,0.03110400140285492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,4,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,4,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,4,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,4,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,4,power_law_1.2,7.502848052978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,4,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,4,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,4,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,4,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,4,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,4,power_law_1.01,4.05852165222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,4,power_law_1.2,9.344204711914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,4,power_law_1.2,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,4,power_law_1.2,0.08970239758491516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,4,power_law_1.2,0.1265663981437683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,4,power_law_1.2,10.756095886230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,4,power_law_1.2,0.18944000005722045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,4,power_law_1.2,12.271206665039063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,4,power_law_1.2,0.2420736074447632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,4,power_law_1.2,16.288934326171876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,4,power_law_1.2,18.270413208007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,4,power_law_1.2,0.3051520109176636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,4,power_law_1.2,0.4859903812408447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,64,power_law_1.01,0.057740801572799684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,64,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,64,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,64,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,64,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,64,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,64,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,64,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,64,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,64,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,64,power_law_1.01,0.05691519975662231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,64,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,4,power_law_1.2,0.6981632232666015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,64,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,64,power_law_1.01,0.061843198537826535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,64,power_law_1.01,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,64,power_law_1.01,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,64,power_law_1.01,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,64,power_law_1.01,0.10444799661636353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,64,power_law_1.01,0.16424959897994995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,64,power_law_1.01,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,64,power_law_1.01,0.3072000026702881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,64,power_law_1.01,0.4216832160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,64,power_law_1.01,0.5171199798583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,64,power_law_1.01,0.7600128173828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,64,power_law_1.01,1.083801555633545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,64,power_law_1.01,1.6123903274536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,64,power_law_1.01,2.25402889251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,4,power_law_1.01,6.371327972412109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,4,power_law_1.2,0.9492480278015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,4,power_law_1.01,7.929241943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,4,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,4,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,4,balanced,0.0358240008354187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,4,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,4,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,4,balanced,0.03754133234421412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,4,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,4,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,4,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,4,balanced,0.047584002216657005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,4,balanced,0.04775466521581014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,4,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,4,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,4,balanced,0.07644799848397572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,4,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,4,balanced,0.062458669145902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,4,balanced,0.08122133215268452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,4,balanced,0.09915733337402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,4,balanced,0.11673600474993388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,4,balanced,0.144896000623703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,4,balanced,0.2757973273595174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,4,balanced,0.3461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,4,balanced,0.5725866556167603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,4,balanced,0.7930880387624105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,4,balanced,1.2357973257700603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,4,balanced,1.6831146876017253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,4,power_law_1.2,1.5855615615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,8,power_law_1.01,0.8976384162902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,8,power_law_1.01,0.8986623764038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,8,power_law_1.01,0.8990592002868653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,8,power_law_1.01,0.9007103919982911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,8,power_law_1.01,0.9048064231872559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,8,power_law_1.01,0.9261055946350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,8,power_law_1.01,1.1665408134460449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,8,power_law_1.01,1.5247296333312987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,8,power_law_1.01,1.802239990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,8,power_law_1.01,2.0731903076171876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,8,power_law_1.01,1.724006462097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,8,power_law_1.01,2.071142387390137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,8,power_law_1.01,2.531532859802246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,8,power_law_1.01,2.5044992446899412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,8,power_law_1.01,3.3853439331054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,8,power_law_1.01,4.230553436279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,8,power_law_1.01,4.465663909912109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,8,power_law_1.01,7.817401885986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,4,power_law_1.2,2.0545536041259767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,8,power_law_1.01,9.195110321044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,8,power_law_1.01,14.502297973632812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,8,power_law_1.01,16.99471435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,8,power_law_1.01,21.38275909423828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,1,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,1,balanced,0.08516266942024231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,1,balanced,0.3089066743850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,1,balanced,0.5775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,1,balanced,1.1060907046000164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,1,balanced,1.366528034210205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,1,balanced,1.3771093686421711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,1,balanced,1.3863253593444824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,1,balanced,1.3977600733439128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,1,balanced,1.405610720316569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,1,balanced,1.423866589864095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,1,balanced,1.4438400268554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,1,balanced,1.460565408070882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,1,balanced,1.497429370880127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,1,balanced,1.5348052978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,8,power_law_1.01,26.365951538085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,1,balanced,1.5701227188110352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,1,balanced,1.6370347340901692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,1,balanced,1.7631573677062988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,1,balanced,1.904981295267741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,1,balanced,2.2277119954427085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,1,balanced,2.518357276916504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,1,balanced,3.162794748942057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,1,balanced,3.67411200205485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,1,balanced,4.875434557596843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,1,balanced,6.221312204996745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,1,balanced,9.048746744791666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,1,balanced,11.715754191080729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,8,power_law_1.01,33.1905029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,8,power_law_1.01,39.15182189941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,4,power_law_1.2,3.284377670288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,8,power_law_1.01,48.789913940429685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,8,power_law_1.01,64.1333251953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,16,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,16,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,16,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,16,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,16,power_law_1.01,0.030675199627876282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,16,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,16,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,16,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,16,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,16,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,16,power_law_1.01,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,16,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,16,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,16,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,16,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,16,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,16,power_law_1.01,0.07310720086097718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,16,power_law_1.01,0.10301439762115479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,16,power_law_1.01,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,16,power_law_1.01,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,16,power_law_1.01,0.3827712059020996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,16,power_law_1.01,0.5822463989257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,16,power_law_1.01,0.6940671920776367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,16,power_law_1.01,1.2843008041381836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,16,power_law_1.01,1.7668096542358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,32,power_law_1.01,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,32,power_law_1.01,0.41635842323303224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,32,power_law_1.01,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,32,power_law_1.01,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,32,power_law_1.01,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,32,power_law_1.01,0.36474881172180174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,32,power_law_1.01,0.33361918926239015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,32,power_law_1.01,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,32,power_law_1.01,0.37396481037139895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,32,power_law_1.01,0.34508800506591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,32,power_law_1.01,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,32,power_law_1.01,0.3710911989212036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,32,power_law_1.01,0.3768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,32,power_law_1.01,0.4014080047607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,32,power_law_1.01,0.4087679862976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,32,power_law_1.01,0.39669759273529054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,32,power_law_1.01,0.42987518310546874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,32,power_law_1.01,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,32,power_law_1.01,0.46694397926330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,32,power_law_1.01,0.4759552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,32,power_law_1.01,0.5576704025268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,32,power_law_1.01,0.7202752113342286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,32,power_law_1.01,0.8474623680114746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,32,power_law_1.01,1.2324864387512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,32,power_law_1.01,1.6080896377563476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,32,power_law_1.01,2.5554943084716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,32,power_law_1.01,3.3011711120605467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,2,power_law_1.2,1.6211904525756835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,2,power_law_1.2,2.371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,2,power_law_1.2,2.8958719253540037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,2,power_law_1.2,3.5698688507080076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,2,power_law_1.2,3.4981758117675783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,2,power_law_1.2,3.564543914794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,4,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,4,balanced,0.24371200799942017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,4,balanced,0.47325865427652997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,4,balanced,0.7623679637908936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,4,balanced,1.0624000231424968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,4,balanced,1.0683733622233074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,4,balanced,1.0733226935068767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,4,balanced,1.0801493326822917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,2,power_law_1.2,3.995443344116211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,4,balanced,1.0860906442006428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,4,balanced,1.0953386624654133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,4,balanced,1.108138640721639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,4,balanced,1.117184003194173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,2,power_law_1.2,4.344217681884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,4,balanced,1.13919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,4,balanced,1.157802661259969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,4,balanced,1.1764053503672283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,2,power_law_1.2,4.874444961547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,4,balanced,1.2147893110911052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,4,balanced,1.2745386759440105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,4,balanced,1.3503146171569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,4,balanced,1.530197302500407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,2,power_law_1.2,5.114470291137695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,4,balanced,1.6965972582499187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,4,balanced,2.019498666127523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,2,power_law_1.2,4.723097610473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,4,balanced,2.4041813214619956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,2,power_law_1.2,5.530214309692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,4,balanced,3.255807876586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,4,balanced,4.0589494705200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,2,power_law_1.2,5.733171081542968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,4,balanced,5.842927932739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,2,power_law_1.2,6.903603363037109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,4,balanced,7.559338887532552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,2,power_law_1.2,6.996787261962891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,2,power_law_1.2,8.573951721191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,2,power_law_1.2,9.73311996459961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,2,power_law_1.2,12.60789794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,2,power_law_1.2,15.679283142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,8,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,8,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,8,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,8,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,8,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,8,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,8,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,8,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,8,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,8,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,8,balanced,0.03565333286921183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,8,balanced,0.03615466753641764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,8,balanced,0.036506667733192444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,8,balanced,0.060405333836873375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,8,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,8,balanced,0.10308266679445903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,8,balanced,0.15172266960144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,8,balanced,0.20548266172409058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,8,balanced,0.22749867041905722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,8,balanced,0.29337600866953534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,8,balanced,0.35923198858896893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,8,balanced,0.5983573198318481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,8,balanced,0.7795999844868978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,2,power_law_1.2,19.46050567626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,2,power_law_1.2,26.870785522460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,2,power_law_1.2,27.772723388671874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,2,power_law_1.2,39.30071105957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,2,power_law_1.2,41.200436401367185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,1,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,1,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,1,power_law_1.01,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,1,power_law_1.01,0.1685439944267273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,1,power_law_1.01,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,1,power_law_1.01,0.35614719390869143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,1,power_law_1.01,0.4982783794403076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,1,power_law_1.01,0.521830415725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,1,power_law_1.01,0.5396480083465576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,1,power_law_1.01,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,1,power_law_1.01,0.5945343971252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,1,power_law_1.01,0.6160384178161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,1,power_law_1.01,0.6400000095367432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,1,power_law_1.01,0.6563839912414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,2,power_law_1.2,60.9470458984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,1,power_law_1.01,0.6682623863220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,1,power_law_1.01,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,1,power_law_1.01,0.7444479942321778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,1,power_law_1.01,0.8316927909851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,1,power_law_1.01,0.9064448356628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,1,power_law_1.01,1.1071488380432128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,1,power_law_1.01,1.2775424003601075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,1,power_law_1.01,1.6744447708129884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,1,power_law_1.01,2.0135936737060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,1,power_law_1.01,2.799001693725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,1,power_law_1.01,3.6124671936035155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,8,power_law_1.2,1.12107515335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,1,power_law_1.01,5.322751998901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,8,power_law_1.2,2.004377555847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,8,power_law_1.2,2.086905670166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,8,power_law_1.2,2.388991928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,1,power_law_1.01,6.9607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,8,power_law_1.2,3.2454654693603517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,8,power_law_1.2,2.4207359313964845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,8,power_law_1.2,3.930073547363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,8,power_law_1.2,3.2452606201171874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,8,power_law_1.2,3.2991233825683595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,8,power_law_1.2,3.4230270385742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,8,power_law_1.2,3.4772926330566407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,8,power_law_1.2,3.8207489013671876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,8,power_law_1.2,3.4936832427978515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,8,power_law_1.2,3.744358444213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,8,power_law_1.2,3.786111831665039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,8,power_law_1.2,4.006911849975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,256,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,8,power_law_1.2,4.209868621826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,256,power_law_1.01,0.07454720139503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,256,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,256,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,8,power_law_1.2,4.29854736328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,256,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,256,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,256,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,8,power_law_1.2,4.599788665771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,256,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,256,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,256,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,256,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,256,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,8,power_law_1.2,4.969062423706054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,256,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,256,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,256,power_law_1.01,0.09748479723930359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,256,power_law_1.01,0.10219520330429077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,256,power_law_1.01,0.1423359990119934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,8,power_law_1.2,5.5339008331298825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,256,power_law_1.01,0.17326079607009887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,256,power_law_1.01,0.23265280723571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,256,power_law_1.01,0.35942399501800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,8,power_law_1.2,6.385459136962891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,256,power_law_1.01,0.36515839099884034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,256,power_law_1.01,0.5189568042755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,256,power_law_1.01,0.5992447853088378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,8,power_law_1.2,7.920230102539063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,256,power_law_1.01,1.0385343551635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,256,power_law_1.01,1.207705593109131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,256,power_law_1.01,1.9714048385620118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,8,power_law_1.2,10.275820922851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,256,power_law_1.01,2.8291072845458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,8,power_law_1.2,10.726399993896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,8,power_law_1.2,14.588517761230468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,8,power_law_1.2,17.505894470214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,2,power_law_1.2,74.016357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,4,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,4,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,4,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,4,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,4,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,4,power_law_1.2,0.04707199931144714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,4,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,4,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,4,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,4,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,4,power_law_1.2,0.05466880202293396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,4,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,4,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,4,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,4,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,4,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,4,power_law_1.2,0.07475200295448303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,4,power_law_1.2,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,4,power_law_1.2,0.11425280570983887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,4,power_law_1.2,0.19742720127105712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,4,power_law_1.2,0.2623487949371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,4,power_law_1.2,0.3586047887802124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,4,power_law_1.2,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,4,power_law_1.2,0.9111359596252442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,4,power_law_1.2,1.2848896026611327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,4,power_law_1.2,1.8130943298339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,4,power_law_1.2,2.4584192276000976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,4,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,4,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,4,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,4,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,4,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,4,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,4,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,4,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,4,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,4,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,4,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,4,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,4,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,4,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,4,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,4,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,4,power_law_1.2,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,4,power_law_1.2,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,4,power_law_1.2,0.20602879524230958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,4,power_law_1.2,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,4,power_law_1.2,0.430079984664917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,4,power_law_1.2,0.7118847846984864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,4,power_law_1.2,1.377894401550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,2,power_law_1.2,85.95558471679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,4,power_law_1.2,1.6672767639160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,2,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,2,power_law_1.01,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,2,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,2,power_law_1.01,0.35489280223846437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,2,power_law_1.01,0.5294079780578613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,2,power_law_1.01,0.7411712169647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,2,power_law_1.01,0.7739391803741456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,2,power_law_1.01,0.811622428894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,2,power_law_1.01,0.7940095901489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,2,power_law_1.01,0.8445887565612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,2,power_law_1.01,0.8554495811462403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,2,power_law_1.01,0.858521556854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,2,power_law_1.01,0.88985595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,2,power_law_1.01,0.8904704093933106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,2,power_law_1.01,0.9086976051330566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,2,power_law_1.01,0.9480192184448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,2,power_law_1.01,0.9082880020141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,2,power_law_1.01,0.9678848266601563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,2,power_law_1.01,1.0196991920471192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,2,power_law_1.01,1.1429887771606446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,2,power_law_1.01,1.2822527885437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,2,power_law_1.01,1.6506879806518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,2,power_law_1.01,1.7301248550415038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,2,power_law_1.01,2.38919677734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,4,power_law_1.2,2.6871807098388674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,2,power_law_1.01,2.8854272842407225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,2,power_law_1.01,4.40709114074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,2,power_law_1.01,5.265407943725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,4,power_law_1.2,0.9107456207275391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,4,power_law_1.2,1.2535807609558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,4,power_law_1.2,1.2494848251342774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,4,power_law_1.2,1.7764352798461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,4,power_law_1.2,1.7731584548950194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,4,power_law_1.2,1.8067455291748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,4,power_law_1.2,2.3359487533569334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,4,power_law_1.2,2.4795135498046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,4,power_law_1.2,2.6042367935180666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,4,power_law_1.2,3.3908737182617186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,4,power_law_1.2,2.9468671798706056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,4,power_law_1.2,2.5995264053344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,4,power_law_1.2,3.136102485656738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,4,power_law_1.2,3.43633918762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,4,power_law_1.2,3.713024139404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,4,power_law_1.2,4.547174453735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,4,power_law_1.2,5.9830078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,4,power_law_1.2,6.78625259399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,4,power_law_1.2,9.588121795654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,4,power_law_1.2,12.435865783691407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,4,power_law_1.2,16.169369506835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,1,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,1,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,1,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,1,balanced,0.14131200313568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,1,balanced,0.3524266481399536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,1,balanced,0.6731093724568685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,1,balanced,0.6789013544718424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,1,balanced,0.6816426912943522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,1,balanced,0.6913706461588541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,1,balanced,0.6952959696451823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,1,balanced,0.7007573445638021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,1,balanced,0.7101439634958903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,1,balanced,0.7190186977386475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,1,balanced,0.7391573588053385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,1,balanced,0.7587733268737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,1,balanced,0.7760213216145834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,1,balanced,0.8149333000183105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,1,balanced,0.8809813658396403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,1,balanced,0.9654613335927328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,1,balanced,1.1354453563690186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,4,power_law_1.2,20.790240478515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,1,balanced,1.3218133449554443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,1,balanced,1.6803840001424153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,1,balanced,2.043733278910319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,1,balanced,2.8357973098754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,1,balanced,3.6858879725138345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,1,balanced,5.391359965006511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,1,balanced,7.094271977742513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,4,power_law_1.2,24.4748291015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,32,power_law_1.2,0.6039552211761474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,32,power_law_1.2,0.5545983791351319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,32,power_law_1.2,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,32,power_law_1.2,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,32,power_law_1.2,0.5535359859466553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,32,power_law_1.2,0.5181439876556396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,32,power_law_1.2,0.4986623764038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,32,power_law_1.2,0.4996863842010498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,32,power_law_1.2,0.5339136123657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,32,power_law_1.2,0.4990975856781006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,32,power_law_1.2,0.5445631980895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,32,power_law_1.2,0.5519360065460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,32,power_law_1.2,0.5424960136413575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,32,power_law_1.2,0.532480001449585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,32,power_law_1.2,0.5646336078643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,32,power_law_1.2,0.5906432151794434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,32,power_law_1.2,0.6047743797302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,32,power_law_1.2,0.6279168128967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,32,power_law_1.2,0.7247871875762939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,32,power_law_1.2,0.8462271690368652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,32,power_law_1.2,1.0438655853271483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,32,power_law_1.2,1.3643775939941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,32,power_law_1.2,1.384832000732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,32,power_law_1.2,2.1163967132568358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,32,power_law_1.2,2.8022783279418944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,32,power_law_1.2,4.076953506469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,32,power_law_1.2,5.145395278930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,4,power_law_1.2,30.005044555664064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,4,balanced,0.2461013396581014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,4,balanced,0.4626773198445638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,4,balanced,0.8901973565419515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,4,balanced,1.5699626604715984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,4,balanced,2.9479039510091147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,4,balanced,4.164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,4,balanced,4.17518933614095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,4,balanced,4.153002738952637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,4,balanced,4.16049067179362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,4,balanced,4.169045448303223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,4,balanced,4.191232045491536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,4,balanced,4.207104047139485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,4,balanced,4.237311999003093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,4,balanced,4.26035213470459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,4,power_law_1.2,36.56765441894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,4,balanced,4.29260794321696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,4,balanced,4.327424049377441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,4,balanced,4.385450681050618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,4,balanced,4.713130633036296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,4,balanced,4.698453267415364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,4,balanced,5.0908158620198565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,4,balanced,4.948458671569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,4,balanced,5.232277234395345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,4,balanced,5.66818110148112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,4,balanced,6.62937609354655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,4,balanced,7.552143732706706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,4,balanced,10.390527725219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,4,balanced,12.78208033243815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,128,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,128,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,128,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,128,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,128,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,128,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,128,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,128,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,128,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,128,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,128,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,128,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,128,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,128,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,128,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,128,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,128,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,128,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,128,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,128,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,128,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,4,power_law_1.2,41.405233764648436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,128,power_law_1.2,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,128,power_law_1.2,0.13393919467926024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,1,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,1,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,1,power_law_1.2,0.09400320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,1,power_law_1.2,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,1,power_law_1.2,0.4378623962402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,1,power_law_1.2,0.6170623779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,1,power_law_1.2,0.7296895980834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,1,power_law_1.2,1.0100735664367675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,1,power_law_1.2,1.0670080184936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,1,power_law_1.2,1.0942463874816895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,1,power_law_1.2,1.1802623748779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,128,power_law_1.2,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,1,power_law_1.2,1.2412927627563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,1,power_law_1.2,1.266483211517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,1,power_law_1.2,1.32423677444458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,1,power_law_1.2,1.4153727531433105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,1,power_law_1.2,1.489510440826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,1,power_law_1.2,1.582489585876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,1,power_law_1.2,1.7784832000732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,1,power_law_1.2,1.9537919998168944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,1,power_law_1.2,2.337376022338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,1,power_law_1.2,2.8180479049682616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,1,power_law_1.2,3.516825485229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,1,power_law_1.2,4.110335922241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,1,power_law_1.2,5.523859024047852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,1,power_law_1.2,6.995148468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,4,power_law_1.2,54.649652099609376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,1,power_law_1.2,9.973760223388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,1,power_law_1.2,12.936601257324218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,128,power_law_1.2,0.36290559768676756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,64,power_law_1.01,0.020684799551963805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,64,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,64,power_law_1.01,0.019865599274635316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,64,power_law_1.01,0.020070399343967437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,64,power_law_1.01,0.020479999482631683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,64,power_law_1.01,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,64,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,64,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,64,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,64,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,64,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,64,power_law_1.01,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,64,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,64,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,64,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,64,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,64,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,64,power_law_1.01,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,64,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,64,power_law_1.01,0.10813440084457397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,64,power_law_1.01,0.12697600126266478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,64,power_law_1.01,0.20108160972595215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,64,power_law_1.01,0.2754431962966919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,64,power_law_1.01,0.46837759017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,64,power_law_1.01,0.6584320068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,128,power_law_1.2,0.5416895866394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,4,power_law_1.2,67.90325927734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,8,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,8,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,8,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,8,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,8,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,8,balanced,0.06929066777229309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,8,balanced,0.21519466241200766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,8,balanced,0.21589332818984985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,8,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,8,balanced,0.21845332781473795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,8,balanced,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,8,balanced,0.2230613430341085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,8,balanced,0.2254506746927897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,8,balanced,0.2295466661453247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,8,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,8,balanced,0.2404693365097046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,8,balanced,0.250709335009257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,8,balanced,0.27135999997456867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,8,balanced,0.2940586606661479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,8,balanced,0.36369065443674725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,8,balanced,0.39765334129333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,8,balanced,0.5165973504384359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,8,balanced,0.734549363454183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,8,balanced,1.1197439829508464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,8,balanced,1.5428266525268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,8,balanced,2.1712212562561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,8,balanced,2.825215975443522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,128,power_law_1.2,0.7305215835571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,16,power_law_1.2,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,16,power_law_1.2,0.17244160175323486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,16,power_law_1.2,0.16588799953460692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,16,power_law_1.2,0.2041856050491333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,16,power_law_1.2,0.09850879907608032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,16,power_law_1.2,0.13393919467926024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,16,power_law_1.2,0.15522559881210327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,16,power_law_1.2,0.14068479537963868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,16,power_law_1.2,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,16,power_law_1.2,0.17879040241241456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,16,power_law_1.2,0.17285120487213135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,16,power_law_1.2,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,16,power_law_1.2,0.22446079254150392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,16,power_law_1.2,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,16,power_law_1.2,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,16,power_law_1.2,0.2461695909500122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,16,power_law_1.2,0.26397440433502195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,16,power_law_1.2,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,16,power_law_1.2,0.33955841064453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,16,power_law_1.2,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,16,power_law_1.2,0.44646401405334474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,16,power_law_1.2,0.6408192157745362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,16,power_law_1.2,0.832307243347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,16,power_law_1.2,1.2359552383422852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,16,power_law_1.2,1.620992088317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,1,power_law_1.01,0.8259584426879882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,1,power_law_1.01,1.4333951950073243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,1,power_law_1.01,2.793267250061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,1,power_law_1.01,4.870143890380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,16,power_law_1.2,3.0627840042114256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,1,power_law_1.01,6.927565002441407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,1,power_law_1.01,11.947417449951171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,1,power_law_1.01,12.68384017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,1,power_law_1.01,13.286195373535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,1,power_law_1.01,13.582131958007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,16,power_law_1.2,3.543040084838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,1,power_law_1.01,13.872735595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,1,power_law_1.01,14.043545532226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,1,power_law_1.01,14.562681579589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,1,power_law_1.01,14.844889831542968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,1,power_law_1.01,15.28115234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,1,power_law_1.01,15.453797912597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,1,power_law_1.01,15.812403869628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,1,power_law_1.01,16.323788452148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,32,power_law_1.01,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,32,power_law_1.01,0.22587521076202394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,32,power_law_1.01,0.22364161014556885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,32,power_law_1.01,0.22323200702667237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,32,power_law_1.01,0.2234368085861206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,32,power_law_1.01,0.15667200088500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,32,power_law_1.01,0.16138240098953247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,32,power_law_1.01,0.1605631947517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,32,power_law_1.01,0.19251199960708618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,1,power_law_1.01,17.045913696289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,32,power_law_1.01,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,32,power_law_1.01,0.1763327956199646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,32,power_law_1.01,0.1968127965927124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,32,power_law_1.01,0.19678720235824584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,32,power_law_1.01,0.23224320411682128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,32,power_law_1.01,0.22300798892974855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,32,power_law_1.01,0.24227840900421144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,32,power_law_1.01,0.2486272096633911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,1,power_law_1.01,17.394688415527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,32,power_law_1.01,0.2942975997924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,32,power_law_1.01,0.3072000026702881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,32,power_law_1.01,0.3827712059020996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,32,power_law_1.01,0.4177919864654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,32,power_law_1.01,0.5154496192932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,32,power_law_1.01,0.591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,32,power_law_1.01,0.9256959915161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,32,power_law_1.01,1.2009471893310546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,1,power_law_1.01,18.687968444824218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,32,power_law_1.01,1.7956863403320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,32,power_law_1.01,2.3631872177124023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,1,power_law_1.01,20.049920654296876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,1,power_law_1.01,23.345350646972655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,1,power_law_1.01,25.608358764648436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,1,power_law_1.01,31.64299621582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,1,power_law_1.01,37.31271667480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,1,power_law_1.01,49.834188842773436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,1,power_law_1.01,63.30839233398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,8,power_law_1.2,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,8,power_law_1.2,0.49315838813781737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,8,power_law_1.2,0.4661248207092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,8,power_law_1.2,0.7514111995697021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,8,power_law_1.2,0.8714240074157715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,8,power_law_1.2,0.6692543983459472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,8,power_law_1.2,0.8435456275939941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,8,power_law_1.2,0.9408512115478516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,8,power_law_1.2,0.9574399948120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,8,power_law_1.2,0.8419327735900879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,8,power_law_1.2,0.8439807891845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,8,power_law_1.2,0.9584639549255372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,8,power_law_1.2,0.9781248092651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,8,power_law_1.2,0.9797568321228027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,8,power_law_1.2,0.9744383811950683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,8,power_law_1.2,1.04017915725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,8,power_law_1.2,1.0868736267089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,8,power_law_1.2,1.128012752532959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,8,power_law_1.2,1.1800576210021974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,8,power_law_1.2,1.3334527969360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,8,power_law_1.2,1.4993151664733886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,8,power_law_1.2,1.718681526184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,2,power_law_1.01,0.21565439701080322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,2,power_law_1.01,0.3596287965774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,8,power_law_1.2,2.0635648727416993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,2,power_law_1.01,0.5234687805175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,2,power_law_1.01,0.8409088134765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,8,power_law_1.2,2.8422016143798827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,2,power_law_1.01,1.1988991737365722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,2,power_law_1.01,1.429708766937256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,8,power_law_1.2,3.5639102935791014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,2,power_law_1.01,1.9159040451049805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,2,power_law_1.01,2.009292793273926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,8,power_law_1.2,5.474099349975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,2,power_law_1.01,2.087116813659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,2,power_law_1.01,2.1581695556640623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,2,power_law_1.01,2.232524871826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,8,power_law_1.2,7.025459289550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,2,power_law_1.01,2.209996795654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,2,power_law_1.01,2.294374465942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,2,power_law_1.01,2.314444732666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,2,power_law_1.01,2.374655914306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,2,power_law_1.01,2.4024703979492186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,2,power_law_1.01,2.401894378662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,2,power_law_1.01,2.568191909790039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,2,power_law_1.01,2.6726400375366213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,2,power_law_1.01,2.797158432006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,2,power_law_1.01,3.045145606994629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,2,power_law_1.01,3.386368179321289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,32,power_law_1.01,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,32,power_law_1.01,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,32,power_law_1.01,0.020883199572563172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,2,power_law_1.01,3.845529556274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,32,power_law_1.01,0.02109439969062805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,32,power_law_1.01,0.021491199731826782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,32,power_law_1.01,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,32,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,32,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,2,power_law_1.01,4.708351898193359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,32,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,32,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,32,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,32,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,32,power_law_1.01,0.0427839994430542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,2,power_law_1.01,5.465907287597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,32,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,32,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,32,power_law_1.01,0.06266239881515503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,32,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,32,power_law_1.01,0.09359359741210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,32,power_law_1.01,0.13557759523391724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,32,power_law_1.01,0.16343040466308595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,2,power_law_1.01,7.34044189453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,32,power_law_1.01,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,32,power_law_1.01,0.3311615943908691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,32,power_law_1.01,0.5552127838134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,32,power_law_1.01,0.7860223770141601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,2,power_law_1.01,9.103155517578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,8,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,8,balanced,0.055125330885251365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,8,balanced,0.2841599980990092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,8,balanced,0.5401599804560343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,8,balanced,1.0320213635762532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,8,balanced,2.0222293535868325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,8,balanced,2.0276907285054526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,8,balanced,2.032639980316162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,8,balanced,2.0358826319376626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,8,balanced,2.0404906272888184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,8,balanced,2.0440746943155923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,8,balanced,2.053290685017904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,8,balanced,2.0577279726664224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,8,balanced,2.0684800148010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,8,balanced,2.083669344584147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,8,balanced,2.094933350880941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,8,balanced,2.1251413027445474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,8,balanced,2.208085378011068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,8,balanced,2.253994623819987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,8,balanced,2.3318187395731607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,8,balanced,2.406912008921305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,8,balanced,2.749098777770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,8,balanced,2.820608139038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,8,balanced,3.0750719706217446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,8,balanced,3.5572052001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,8,balanced,4.444501241048177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,8,balanced,5.5780690511067705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,2,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,2,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,2,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,2,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,2,balanced,0.15359999736150107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,2,balanced,0.35498666763305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,2,balanced,0.35633599758148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,2,balanced,0.3582293192545573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,2,balanced,0.36215468247731525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,2,balanced,0.3630026578903198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,2,balanced,0.3667626778284709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,2,balanced,0.373418649037679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,2,balanced,0.37768534819285077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,2,balanced,0.3848533233006795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,2,balanced,0.3942399819691976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,2,balanced,0.400383989016215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,2,balanced,0.41574398676554364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,2,balanced,0.446122686068217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,2,balanced,0.48298664887746173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,2,balanced,0.5382826725641886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,2,balanced,0.6033066511154175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,2,balanced,0.7717546621958414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,2,balanced,0.9431040287017822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,2,balanced,1.3550933202107747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,2,balanced,1.7169067064921062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,2,balanced,2.4401920636494956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,2,balanced,3.2834558486938477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,64,power_law_1.01,0.33013761043548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,64,power_law_1.01,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,64,power_law_1.01,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,64,power_law_1.01,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,64,power_law_1.01,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,64,power_law_1.01,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,64,power_law_1.01,0.30064640045166013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,64,power_law_1.01,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,64,power_law_1.01,0.29122560024261473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,64,power_law_1.01,0.30658559799194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,64,power_law_1.01,0.255180811882019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,64,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,64,power_law_1.01,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,64,power_law_1.01,0.30945279598236086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,64,power_law_1.01,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,64,power_law_1.01,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,64,power_law_1.01,0.33996798992156985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,64,power_law_1.01,0.40079360008239745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,64,power_law_1.01,0.4014080047607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,64,power_law_1.01,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,64,power_law_1.01,0.5381951808929444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,64,power_law_1.01,0.7997439861297607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,64,power_law_1.01,0.97259521484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,64,power_law_1.01,1.5114239692687987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,64,power_law_1.01,2.1694463729858398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,64,power_law_1.01,3.081011199951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,64,power_law_1.01,4.015718460083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,128,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,128,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,128,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,128,power_law_1.01,0.04604159891605377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,128,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,128,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,128,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,128,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,128,power_law_1.01,0.04852479994297028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,128,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,128,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,128,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,128,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,128,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,128,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,128,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,128,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,128,power_law_1.01,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,128,power_law_1.01,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,128,power_law_1.01,0.15912959575653077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,128,power_law_1.01,0.22425599098205568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,128,power_law_1.01,0.3342335939407349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,128,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,128,power_law_1.01,0.638976001739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,128,power_law_1.01,0.8187904357910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,128,power_law_1.01,1.261567974090576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,128,power_law_1.01,1.7106943130493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,16,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,16,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,16,balanced,0.02951466788848241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,16,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,16,balanced,0.23806933561960855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,16,balanced,0.23944532871246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,16,balanced,0.2404693365097046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,16,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,16,balanced,0.24183466037114462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,16,balanced,0.24285332361857095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,16,balanced,0.2445653279622396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,16,balanced,0.24627200762430826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,16,balanced,0.24727465709050497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,16,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,16,balanced,0.25651200612386066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,16,balanced,0.2585600018501282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,16,balanced,0.26419200499852497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,16,balanced,0.27460267146428424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,16,balanced,0.27665066719055176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,16,balanced,0.31060800949732464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,16,balanced,0.31675734122594196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,16,balanced,0.38228265444437665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,16,balanced,0.38789868354797363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,16,balanced,0.5578933159510294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,16,balanced,0.7038293679555258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,16,balanced,1.0697387059529622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,16,balanced,1.3822293281555176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,64,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,64,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,64,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,64,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,64,power_law_1.01,0.036211198568344115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,64,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,64,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,64,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,64,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,64,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,64,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,64,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,64,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,64,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,64,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,64,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,64,power_law_1.01,0.05077120065689087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,64,power_law_1.01,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,64,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,64,power_law_1.01,0.10096640586853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,64,power_law_1.01,0.1111680030822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,64,power_law_1.01,0.1519487977027893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,64,power_law_1.01,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,64,power_law_1.01,0.3635200023651123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,64,power_law_1.01,0.4710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,64,power_law_1.01,0.6985727787017822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,64,power_law_1.01,1.013145637512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,64,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,64,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,64,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,64,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,64,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,64,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,64,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,64,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,64,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,64,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,64,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,64,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,64,power_law_1.01,0.06572800278663635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,64,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,64,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,64,power_law_1.01,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,64,power_law_1.01,0.10424319505691529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,64,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,64,power_law_1.01,0.16138240098953247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,64,power_law_1.01,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,64,power_law_1.01,0.19804160594940184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,64,power_law_1.01,0.022086399793624877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,64,power_law_1.01,0.32665600776672366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,64,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,64,power_law_1.01,0.393830394744873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,64,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,64,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,64,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,64,power_law_1.01,0.6227968215942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,64,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,64,power_law_1.01,0.023526400327682495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,64,power_law_1.01,0.8331263542175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,64,power_law_1.01,1.4129152297973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,64,power_law_1.01,1.757593536376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,64,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,64,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,64,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,64,power_law_1.01,0.02659200131893158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,64,power_law_1.01,0.027820798754692077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,64,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,64,power_law_1.01,0.03030399978160858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,64,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,64,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,64,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,64,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,64,power_law_1.01,0.07925760149955749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,64,power_law_1.01,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,64,power_law_1.01,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,64,power_law_1.01,0.2654207944869995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,64,power_law_1.01,0.4030464172363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,64,power_law_1.01,0.5306367874145508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,2,balanced,0.04010133445262909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,2,balanced,0.27323732773462933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,2,balanced,0.5287253459294637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,2,balanced,0.5307733217875162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,2,balanced,0.5321386655171713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,2,balanced,0.5358933210372925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,2,balanced,0.5393066803614298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,2,balanced,0.5411839882532755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,2,balanced,0.5486933390299479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,2,balanced,0.5515946547190348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,2,balanced,0.5556906859079996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,2,balanced,0.5575679937998453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,2,balanced,0.5614933172861735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,2,balanced,0.5684906641642252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,2,balanced,0.6087679862976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,2,balanced,0.6355520089467367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,2,balanced,0.6901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,2,balanced,0.6691839694976807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,2,balanced,0.7403519948323568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,2,balanced,0.9412266413370768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,2,balanced,1.1707733472188313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,2,balanced,1.6343040466308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,2,balanced,2.2031359672546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,2,balanced,3.169621467590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,2,balanced,4.08627192179362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,2,balanced,5.792426427205403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,2,balanced,7.545514424641927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,4,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,4,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,4,balanced,0.28433066606521606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,4,balanced,0.5558613141377767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,4,balanced,1.047375996907552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,8,power_law_1.2,0.4569087982177734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,4,balanced,2.0183040301005044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,8,power_law_1.2,0.43130879402160643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,8,power_law_1.2,0.6518784046173096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,4,balanced,2.99946657816569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,8,power_law_1.2,0.6135615825653076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,4,balanced,3.006629308064779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,8,power_law_1.2,0.7432191848754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,8,power_law_1.2,0.8298496246337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,4,balanced,3.014826774597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,8,power_law_1.2,0.7899136066436767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,4,balanced,3.0192639032999673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,8,power_law_1.2,0.8062975883483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,8,power_law_1.2,0.8548352241516113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,4,balanced,3.0303573608398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,8,power_law_1.2,0.8648703575134278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,4,balanced,3.044864018758138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,8,power_law_1.2,0.9174912452697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,8,power_law_1.2,0.8919039726257324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,4,balanced,3.0557759602864585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,8,power_law_1.2,0.9259008407592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,8,power_law_1.2,0.9306112289428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,4,balanced,3.0766080220540366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,8,power_law_1.2,0.9469951629638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,4,balanced,3.1020374298095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,8,power_law_1.2,0.9136128425598145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,8,power_law_1.2,0.991436767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,4,balanced,3.116885185241699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,8,power_law_1.2,1.0602496147155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,4,balanced,3.152554512023926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,8,power_law_1.2,1.2105536460876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,4,balanced,3.2235520680745444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,8,power_law_1.2,1.4764032363891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,8,power_law_1.2,1.7772544860839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,4,balanced,3.289600054423014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,4,balanced,3.4123093287150064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,8,power_law_1.2,2.657075119018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,4,balanced,3.534165382385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,4,balanced,3.815765380859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,8,power_law_1.2,2.3578624725341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,4,balanced,4.1355946858723955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,4,balanced,4.6595414479573565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,4,balanced,5.039786656697591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,8,power_law_1.2,3.9665470123291016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,4,balanced,6.2392317454020185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,4,balanced,7.751338958740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,8,power_law_1.2,4.473651123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,1,power_law_1.01,0.03252480030059814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,1,power_law_1.01,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,1,power_law_1.01,0.4462592124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,1,power_law_1.01,0.6641664028167724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,1,power_law_1.01,0.8847359657287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,1,power_law_1.01,1.4614208221435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,1,power_law_1.01,1.518182373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,1,power_law_1.01,1.5152959823608398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,1,power_law_1.01,1.5962112426757813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,1,power_law_1.01,1.6779264450073241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,1,power_law_1.01,1.6455680847167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,1,power_law_1.01,1.7262592315673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,1,power_law_1.01,1.722163200378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,1,power_law_1.01,1.7303552627563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,1,power_law_1.01,1.7920000076293945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,1,power_law_1.01,1.8173952102661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,1,power_law_1.01,1.8423807144165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,1,power_law_1.01,1.9091455459594726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,1,power_law_1.01,1.9968000411987306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,1,power_law_1.01,2.205695915222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,1,power_law_1.01,2.427903938293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,1,power_law_1.01,2.9468671798706056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,1,power_law_1.01,3.2088062286376955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,1,power_law_1.01,4.170956802368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,1,power_law_1.01,5.243904113769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,1,power_law_1.01,7.411711883544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,1,power_law_1.01,9.639116668701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,8,power_law_1.2,5.677465438842773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,8,power_law_1.2,8.297267150878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,32,power_law_1.2,1.0788543701171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,32,power_law_1.2,1.5413248062133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,32,power_law_1.2,1.5372096061706544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,32,power_law_1.2,1.5388671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,32,power_law_1.2,1.5380096435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,32,power_law_1.2,1.3195263862609863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,32,power_law_1.2,0.9768704414367676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,32,power_law_1.2,1.32423677444458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,32,power_law_1.2,1.084620761871338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,32,power_law_1.2,1.265459156036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,32,power_law_1.2,1.4125056266784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,32,power_law_1.2,1.3735936164855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,32,power_law_1.2,1.3813759803771972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,32,power_law_1.2,1.4249983787536622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,32,power_law_1.2,1.3617152214050292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,32,power_law_1.2,1.425203227996826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,32,power_law_1.2,1.5370112419128419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,2,power_law_1.2,0.3848191976547241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,2,power_law_1.2,0.6676479816436768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,32,power_law_1.2,1.665011215209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,2,power_law_1.2,0.9123647689819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,32,power_law_1.2,1.588428783416748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,2,power_law_1.2,1.4063615798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,32,power_law_1.2,1.9734527587890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,2,power_law_1.2,1.863270378112793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,32,power_law_1.2,2.3207616806030273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,2,power_law_1.2,2.798387145996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,32,power_law_1.2,2.8923904418945314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,2,power_law_1.2,3.6364288330078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,32,power_law_1.2,3.3277633666992186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,2,power_law_1.2,3.8965248107910155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,32,power_law_1.2,4.595711898803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,2,power_law_1.2,4.1056255340576175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,2,power_law_1.2,4.097843170166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,32,power_law_1.2,5.604940795898438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,2,power_law_1.2,4.027187347412109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,2,power_law_1.2,4.526079940795898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,32,power_law_1.2,8.917401885986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,2,power_law_1.2,4.465030288696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,2,power_law_1.2,4.639731216430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,2,power_law_1.2,4.759347152709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,32,power_law_1.2,12.011724853515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,2,power_law_1.2,4.878950500488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,2,power_law_1.2,5.028659057617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,2,power_law_1.2,5.1308544158935545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,2,power_law_1.2,5.389926528930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,2,power_law_1.2,5.7298942565917965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,2,power_law_1.2,6.122905731201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,2,power_law_1.2,7.129087829589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,2,power_law_1.2,7.569203186035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,2,power_law_1.2,9.591366577148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,2,power_law_1.2,10.848863983154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,2,power_law_1.2,14.045184326171874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,2,power_law_1.2,16.96378936767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,4,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,4,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,4,power_law_1.2,0.17182719707489014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,4,power_law_1.2,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,4,power_law_1.2,0.2791424036026001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,4,power_law_1.2,0.4001791954040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,4,power_law_1.2,0.4030464172363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,4,power_law_1.2,0.43765759468078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,4,power_law_1.2,0.4321280002593994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,4,power_law_1.2,0.4511744022369385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,4,power_law_1.2,0.4302847862243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,4,power_law_1.2,0.44359679222106935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,4,power_law_1.2,0.44953598976135256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,4,power_law_1.2,0.44994559288024905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,4,power_law_1.2,0.44851198196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,4,power_law_1.2,0.481279993057251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,4,power_law_1.2,0.48619518280029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,4,power_law_1.2,0.5160895824432373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,4,power_law_1.2,0.5373824119567872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,4,power_law_1.2,0.6236159801483154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,4,power_law_1.2,0.7403456211090088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,4,power_law_1.2,1.0309632301330567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,4,power_law_1.2,1.0893183708190919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,4,power_law_1.2,1.3811712265014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,16,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,16,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,16,power_law_1.2,0.02948479950428009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,16,power_law_1.2,0.029260799288749695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,16,power_law_1.2,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,16,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,16,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,16,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,16,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,16,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,16,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,16,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,16,power_law_1.2,0.04071680009365082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,16,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,16,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,16,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,16,power_law_1.2,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,16,power_law_1.2,0.11612160205841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,16,power_law_1.2,0.2031615972518921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,16,power_law_1.2,0.3190783977508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,4,power_law_1.2,2.0539392471313476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,16,power_law_1.2,0.4536320209503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,1,power_law_1.01,0.8357888221740722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,1,power_law_1.01,1.4624768257141114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,1,power_law_1.01,2.8889087677001952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,1,power_law_1.01,5.037055969238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,1,power_law_1.01,7.198310089111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,1,power_law_1.01,12.054118347167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,16,power_law_1.2,0.6625279903411865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,1,power_law_1.01,12.915303039550782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,1,power_law_1.01,13.368730163574218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,1,power_law_1.01,13.944627380371093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,4,power_law_1.2,2.8821504592895506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,16,power_law_1.2,0.8466431617736816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,1,power_law_1.01,14.000537109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,1,power_law_1.01,14.64074249267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,1,power_law_1.01,14.651187133789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,1,power_law_1.01,15.109120178222657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,1,power_law_1.01,15.6579833984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,1,power_law_1.01,15.996109008789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,1,power_law_1.01,16.550706481933595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,1,power_law_1.01,17.231053161621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,1,power_law_1.01,17.974476623535157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,16,power_law_1.2,1.6648191452026366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,1,power_law_1.01,18.60648956298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,1,power_law_1.01,19.9841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,1,power_law_1.01,20.001177978515624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,1,power_law_1.01,23.621632385253907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,16,power_law_1.2,2.002739143371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,1,power_law_1.01,24.40396728515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,16,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,16,balanced,0.02456533412138621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,16,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,16,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,16,balanced,0.030346666773160298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,16,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,16,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,16,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,1,power_law_1.01,30.273126220703126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,16,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,16,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,16,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,16,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,16,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,16,balanced,0.04146666576464971
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,16,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,16,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,16,balanced,0.056832000613212585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,16,balanced,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,16,balanced,0.07765333354473114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,16,balanced,0.1539413332939148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,16,balanced,0.1962666710217794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,16,balanced,0.3304106593132019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,16,balanced,0.4437013467152913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,8,balanced,0.019797333826621372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,8,balanced,0.019797333826621372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,8,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,8,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,8,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,8,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,8,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,8,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,8,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,8,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,8,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,8,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,8,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,8,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,8,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,8,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,8,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,8,balanced,0.04128533353408178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,8,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,8,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,8,balanced,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,8,balanced,0.11161599556605022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,8,balanced,0.21282132466634116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,8,balanced,0.276309331258138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,8,balanced,0.4763306776682536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,8,balanced,0.696832021077474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,1,power_law_1.01,34.9296630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,1,power_law_1.01,48.77107238769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,4,power_law_1.2,3.6145153045654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,1,power_law_1.01,56.63006591796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,32,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,32,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,32,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,32,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,32,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,32,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,32,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,32,power_law_1.2,0.029068800806999206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,32,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,32,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,32,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,32,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,32,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,32,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,32,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,32,power_law_1.2,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,32,power_law_1.2,0.1052672028541565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,32,power_law_1.2,0.13905919790267945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,32,power_law_1.2,0.159334397315979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,32,power_law_1.2,0.20643839836120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,32,power_law_1.2,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,32,power_law_1.2,0.506060791015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,32,power_law_1.2,0.861184024810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,32,power_law_1.2,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,128,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,128,balanced,0.054085334142049156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,128,balanced,0.06297599772612254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,128,balanced,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,128,balanced,0.22169599930445352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,128,balanced,0.2228906750679016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,128,balanced,0.22235733270645142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,128,balanced,0.22406933705012003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,128,balanced,0.22715733448664346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,128,balanced,0.22920533021291098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,128,balanced,0.23040000597635904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,128,balanced,0.23534933725992838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,128,balanced,0.23754666248957315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,128,balanced,0.2435413400332133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,128,balanced,0.25545599063237506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,128,balanced,0.2725546757380168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,128,balanced,0.29525333642959595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,128,balanced,0.3136853377024333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,128,balanced,0.35788798332214355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,128,balanced,0.4432053168614705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,128,balanced,0.5265066623687744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,128,balanced,0.6010880072911581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,128,balanced,0.8277333577473959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,128,balanced,1.0864640076955159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,64,balanced,0.023013333479563396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,64,balanced,0.02250133454799652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,64,balanced,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,64,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,64,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,64,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,64,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,64,balanced,0.024901332954565685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,64,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,64,balanced,0.02491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,64,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,64,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,64,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,64,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,64,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,64,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,64,balanced,0.03088533381621043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,64,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,32,power_law_1.2,1.59170560836792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,64,balanced,0.035829332967599235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,64,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,64,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,64,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,64,balanced,0.08516266942024231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,64,balanced,0.16452266772588095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,64,balanced,0.28962133328119916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,64,balanced,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,32,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,32,power_law_1.01,0.04010879993438721
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,32,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,32,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,32,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,32,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,32,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,32,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,32,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,32,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,32,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,32,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,32,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,32,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,32,power_law_1.01,0.055289602279663085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,32,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,32,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,32,power_law_1.01,0.08212479948997498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,32,power_law_1.01,0.11427839994430541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,32,power_law_1.01,0.12554240226745605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,32,power_law_1.01,0.18984960317611693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,32,power_law_1.01,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,32,power_law_1.01,0.36126720905303955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,32,power_law_1.01,0.49170560836791993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,32,power_law_1.01,0.8384511947631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,32,power_law_1.01,1.1446271896362306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,32,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,32,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,32,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,32,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,32,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,32,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,32,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,32,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,32,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,32,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,32,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,32,power_law_1.2,0.03909760117530823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,32,power_law_1.2,0.03971840143203735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,32,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,1,balanced,0.33177600304285687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,1,balanced,0.5821439822514852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,32,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,1,balanced,1.1182080109914143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,32,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,1,balanced,2.19270928700765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,32,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,32,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,32,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,1,balanced,4.340383847554524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,32,power_law_1.2,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,32,power_law_1.2,0.10342400074005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,32,power_law_1.2,0.14274560213088988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,1,balanced,5.396650950113933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,32,power_law_1.2,0.20623359680175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,32,power_law_1.2,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,1,balanced,5.413717269897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,32,power_law_1.2,0.4782080173492432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,32,power_law_1.2,0.7679999828338623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,1,balanced,5.434368133544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,32,power_law_1.2,1.1935744285583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,1,balanced,5.453823725382487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,1,balanced,5.472426732381185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,1,balanced,5.505365371704102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,1,balanced,5.541717529296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,1,balanced,5.577386856079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,1,balanced,5.63968022664388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,1,balanced,5.705898920694987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,1,balanced,5.9255415598551435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,1,balanced,6.028799692789714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,1,balanced,6.216021219889323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,1,balanced,6.393856048583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,1,balanced,7.302656173706055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,1,balanced,6.8428694407145185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,1,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,1,power_law_1.01,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,1,balanced,7.718229293823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,1,power_law_1.01,0.34816000461578367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,1,power_law_1.01,0.667852783203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,1,power_law_1.01,0.9965248107910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,1,power_law_1.01,1.3232128143310546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,1,balanced,8.653141021728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,1,power_law_1.01,1.8749439239501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,1,power_law_1.01,1.9338943481445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,1,power_law_1.01,2.024857521057129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,1,balanced,10.663935979207357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,1,power_law_1.01,2.0961151123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,1,power_law_1.01,2.108415985107422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,1,power_law_1.01,2.2577152252197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,1,balanced,13.491711934407553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,1,power_law_1.01,2.225971221923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,1,power_law_1.01,2.348851203918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,1,power_law_1.01,2.359084892272949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,1,power_law_1.01,2.487705612182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,1,power_law_1.01,2.568806457519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,1,balanced,19.089749654134113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,1,power_law_1.01,2.715033531188965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,1,power_law_1.01,2.8239871978759767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,1,power_law_1.01,3.081216049194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,1,power_law_1.01,3.2266239166259765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,1,power_law_1.01,3.7119998931884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,1,balanced,24.6471684773763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,1,power_law_1.01,4.070604705810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,1,power_law_1.01,5.2236286163330075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,1,power_law_1.01,6.07006721496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,1,power_law_1.01,8.31426544189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,1,power_law_1.01,10.45749740600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,1,power_law_1.2,0.24657919406890869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,1,power_law_1.2,0.45055999755859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,1,power_law_1.2,0.7841792106628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,1,power_law_1.2,1.1898880004882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,1,power_law_1.2,1.557913589477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,1,power_law_1.2,2.8788736343383787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,1,power_law_1.2,3.0244863510131834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,1,power_law_1.2,3.1696895599365233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,1,power_law_1.2,3.2890880584716795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,1,power_law_1.2,3.337420654296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,1,power_law_1.2,3.322470474243164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,1,power_law_1.2,3.421772766113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,1,power_law_1.2,3.443097686767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,1,power_law_1.2,3.5186687469482423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,1,power_law_1.2,3.566387176513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,1,power_law_1.2,3.60816650390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,1,power_law_1.2,3.6994686126708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,1,power_law_1.2,3.8836223602294924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,1,power_law_1.2,4.06036491394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,1,power_law_1.2,4.4886016845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,1,power_law_1.2,5.0243583679199215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,1,power_law_1.2,5.965209579467773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,64,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,64,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,64,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,64,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,64,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,1,power_law_1.2,7.038156890869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,64,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,64,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,64,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,64,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,64,power_law_1.01,0.03255679905414581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,64,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,64,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,64,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,1,power_law_1.2,9.076121520996093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,64,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,64,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,64,power_law_1.01,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,64,power_law_1.01,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,64,power_law_1.01,0.17121280431747438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,64,power_law_1.01,0.31703040599822996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,64,power_law_1.01,0.39874560832977296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,64,power_law_1.01,0.6735871791839599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,1,power_law_1.2,10.748313903808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,1,power_law_1.2,15.090278625488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,1,power_law_1.2,19.4840576171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,16,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,16,power_law_1.2,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,16,power_law_1.2,0.23101439476013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,16,power_law_1.2,0.2871295928955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,16,power_law_1.2,0.2486272096633911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,16,power_law_1.2,0.296345591545105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,16,power_law_1.2,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,16,power_law_1.2,0.265011191368103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,16,power_law_1.2,0.2748415946960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,16,power_law_1.2,0.24432640075683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,16,power_law_1.2,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,16,power_law_1.2,0.2631680011749268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,16,power_law_1.2,0.2641792058944702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,16,power_law_1.2,0.28241920471191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,16,power_law_1.2,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,16,power_law_1.2,0.3280895948410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,16,power_law_1.2,0.33710079193115233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,16,power_law_1.2,0.37253119945526125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,16,power_law_1.2,0.41943039894104006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,16,power_law_1.2,0.4655104160308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,16,power_law_1.2,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,16,power_law_1.2,0.7679999828338623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,16,power_law_1.2,0.9533439636230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,16,power_law_1.2,1.3764608383178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,16,power_law_1.2,1.7330175399780274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,16,power_law_1.2,2.817024040222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,16,power_law_1.2,3.6843521118164064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,1,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,1,balanced,0.03973866750796636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,1,balanced,0.16264533003171286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,1,balanced,0.3715413411458333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,1,balanced,0.6978240013122559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,1,balanced,0.9437867005666097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,1,balanced,0.9492479960123698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,1,balanced,0.953658660252889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,1,balanced,0.9586346944173177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,1,balanced,0.9627306461334229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,1,balanced,0.9712639649709066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,1,balanced,1.0023039976755779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,1,balanced,0.9874613285064697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,1,balanced,1.0002773602803547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,1,balanced,1.0122240384419758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,1,balanced,1.0260480244954426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,1,balanced,1.0525013605753581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,1,balanced,1.1037013530731201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,1,balanced,1.1574613253275554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,1,balanced,1.2554240226745605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,1,balanced,1.3595306078592937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,1,balanced,1.5894187291463215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,1,balanced,1.82476806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,1,balanced,2.3045120239257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,1,balanced,2.8035147984822593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,1,balanced,3.9307947158813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,1,balanced,5.003424008687337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,2,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,2,power_law_1.01,0.16732159852981568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,2,power_law_1.01,0.30310399532318116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,2,power_law_1.01,0.4005887985229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,2,power_law_1.01,0.4767744064331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,2,power_law_1.01,0.7647232055664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,2,power_law_1.01,0.7866367816925048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,2,power_law_1.01,0.8065024375915527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,2,power_law_1.01,0.8458239555358886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,2,power_law_1.01,0.8466431617736816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,2,power_law_1.01,0.832307243347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,2,power_law_1.01,0.8675328254699707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,2,power_law_1.01,0.8984576225280761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,2,power_law_1.01,0.911564826965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,2,power_law_1.01,0.951091194152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,2,power_law_1.01,0.9609215736389161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,2,power_law_1.01,0.9981951713562012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,2,power_law_1.01,1.04017915725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,2,power_law_1.01,1.1018239974975585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,2,power_law_1.01,1.223680019378662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,2,power_law_1.01,1.4223360061645507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,2,power_law_1.01,1.79998722076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,2,power_law_1.01,2.183782386779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,2,power_law_1.01,2.8016639709472657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,16,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,16,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,16,balanced,0.05153599878152212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,16,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,16,balanced,0.279039998849233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,2,power_law_1.01,3.438796615600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,16,balanced,0.5437440077463785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,16,balanced,0.7978666623433431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,16,balanced,0.801962693532308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,16,balanced,0.8031573295593262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,16,balanced,0.8038400014241537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,16,balanced,0.799232006072998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,16,balanced,0.8048640092213949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,16,balanced,0.8058880170186361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,2,power_law_1.01,5.300019073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,16,balanced,0.8122026920318604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,16,balanced,0.8205653031667074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,16,balanced,0.8231253623962402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,16,balanced,0.8376320203145345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,16,balanced,0.861525297164917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,16,balanced,0.8901973565419515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,16,balanced,0.93559463818868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,16,balanced,0.9716053009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,2,power_law_1.01,6.820658874511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,16,balanced,1.0734933217366536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,16,balanced,1.1921066443125408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,16,balanced,1.4172159830729167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,16,balanced,1.6585386594136555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,16,balanced,2.103125254313151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,16,balanced,2.602666695912679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,1,power_law_1.01,0.5148672103881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,1,power_law_1.01,0.7372799873352051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,1,power_law_1.01,0.9846783638000488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,1,power_law_1.01,1.6510976791381835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,1,power_law_1.01,1.7311744689941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,1,power_law_1.01,1.7504255294799804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,1,power_law_1.01,1.7634944915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,1,power_law_1.01,1.7741823196411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,1,power_law_1.01,1.8001920700073242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,1,power_law_1.01,1.8309120178222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,1,power_law_1.01,1.9339263916015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,1,power_law_1.01,1.98287353515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,1,power_law_1.01,2.0283391952514647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,1,power_law_1.01,2.082803153991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,1,power_law_1.01,2.224537658691406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,1,power_law_1.01,2.3359487533569334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,1,power_law_1.01,2.5153535842895507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,1,power_law_1.01,2.915532875061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,1,power_law_1.01,3.308339309692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,1,power_law_1.01,4.1699073791503904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,1,power_law_1.01,4.831232070922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,1,power_law_1.01,6.508544158935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,1,balanced,0.29388266801834106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,1,balanced,0.5321386655171713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,1,balanced,1.0297866662343342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,1,balanced,1.0210986932118733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,1,balanced,1.0279146830240886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,1,balanced,1.0357706546783447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,1,balanced,1.044650634129842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,1,balanced,1.0683733622233074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,1,balanced,1.0562559763590496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,1,balanced,1.0654719670613606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,1,balanced,1.0787839889526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,1,balanced,1.0951680342356365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,1,balanced,1.113258679707845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,1,balanced,1.1372959613800049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,1,balanced,1.1992479960123699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,1,balanced,1.2206079959869385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,1,balanced,1.2311840057373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,1,balanced,1.3982720375061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,1,balanced,1.5206400553385417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,1,balanced,1.9215359687805176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,1,balanced,2.39957332611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,1,balanced,3.3669118881225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,1,balanced,4.338346799214681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,1,balanced,6.283066431681315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,1,balanced,8.455850601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,1,power_law_1.01,7.973887634277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,1,balanced,12.230144500732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,1,balanced,16.371541341145832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,1,power_law_1.01,11.053465270996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,1,power_law_1.01,15.781683349609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,1,power_law_1.01,23.5509765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,8,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,8,power_law_1.2,0.15564800500869752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,8,power_law_1.2,0.0960319995880127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,8,power_law_1.2,0.23713281154632568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,8,power_law_1.2,0.3047424077987671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,8,power_law_1.2,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,8,power_law_1.2,0.3405823945999146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,8,power_law_1.2,0.3221503973007202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,8,power_law_1.2,0.3020607948303223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,8,power_law_1.2,0.3258368015289307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,8,power_law_1.2,0.3211071968078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,8,power_law_1.2,0.31801600456237794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,8,power_law_1.2,0.3579904079437256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,8,power_law_1.2,0.3354624032974243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,8,power_law_1.2,0.3473407983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,8,power_law_1.2,0.35676159858703616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,8,power_law_1.2,0.3548991918563843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,8,power_law_1.2,0.39360001087188723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,8,power_law_1.2,0.40611839294433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,8,power_law_1.2,0.4444159984588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,8,power_law_1.2,0.4943871974945068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,8,power_law_1.2,0.5822463989257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,8,power_law_1.2,0.7988927841186524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,8,power_law_1.2,1.0190848350524901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,8,power_law_1.2,1.2488703727722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,8,power_law_1.2,1.895212745666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,8,power_law_1.2,2.4612863540649412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,2,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,2,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,2,balanced,0.28296534220377606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,2,balanced,0.5299199819564819
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,2,balanced,1.024341344833374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,2,balanced,2.0053332646687827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,2,balanced,2.9784746170043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,2,balanced,2.986837387084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,2,balanced,2.9958826700846353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,2,balanced,3.0055999755859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,2,balanced,3.022336006164551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,2,balanced,3.0407679875691733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,2,balanced,3.057493209838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,2,balanced,3.087360064188639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,2,balanced,3.1165440877278647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,2,balanced,3.1411145528157554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,2,balanced,3.1989758809407554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,2,balanced,3.3049599329630532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,2,balanced,3.39847469329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,2,balanced,3.5909973780314126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,2,balanced,3.7942612965901694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,2,balanced,4.210517247517903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,16,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,16,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,16,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,16,balanced,0.29047467311223346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,2,balanced,4.560895919799805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,16,balanced,0.5374293327331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,16,balanced,1.0431146621704102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,16,balanced,1.0477226575215657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,16,balanced,1.035434643427531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,16,balanced,1.0400426387786865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,2,balanced,5.489487965901692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,16,balanced,1.040554682413737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,16,balanced,1.0455040136973064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,16,balanced,1.0499413013458252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,16,balanced,1.0547146797180176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,16,balanced,1.063594659169515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,2,balanced,6.290602366129558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,16,balanced,1.0752000013987224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,16,balanced,1.0845866998036702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,16,balanced,1.0994346936543782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,16,balanced,1.13100798924764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,16,balanced,1.1661653518676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,16,balanced,1.2306666374206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,2,balanced,7.995733261108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,16,balanced,1.2975786526997883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,16,balanced,1.385983943939209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,16,balanced,1.497770627339681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,16,balanced,1.7440427144368489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,2,balanced,9.782954533894857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,16,balanced,2.099712053934733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,16,balanced,2.918229420979818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,16,balanced,3.5932159423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,8,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,8,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,8,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,8,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,8,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,8,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,8,balanced,0.03819733361403147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,8,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,8,balanced,0.03958933303753535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,8,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,8,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,8,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,8,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,8,balanced,0.08086933195590973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,8,balanced,0.14847999811172485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,8,balanced,0.22220800320307413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,8,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,8,balanced,0.3218773404757182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,8,balanced,0.38809601465861004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,8,balanced,0.5249706506729126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,8,balanced,0.7121919790903727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,8,balanced,1.1883520285288494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,8,balanced,1.6061439514160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,1,power_law_1.01,28.160205078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,16,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,16,power_law_1.2,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,16,power_law_1.2,0.02109439969062805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,16,power_law_1.2,0.02088959962129593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,16,power_law_1.2,0.021299199759960176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,16,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,16,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,16,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,16,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,16,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,16,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,16,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,16,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,16,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,16,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,16,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,16,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,16,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,16,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,16,power_law_1.2,0.09071360230445862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,16,power_law_1.2,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,16,power_law_1.2,0.18309119939804078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,16,power_law_1.2,0.23121280670166017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,16,power_law_1.2,0.37519359588623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,16,power_law_1.01,0.061222398281097413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,16,power_law_1.01,0.1968127965927124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,16,power_law_1.01,0.1458176016807556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,16,power_law_1.01,0.11182080507278443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,16,power_law_1.01,0.19988479614257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,16,power_law_1.01,0.13188480138778685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,16,power_law_1.01,0.13557759523391724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,16,power_law_1.01,0.19148800373077393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,16,power_law_1.01,0.14172159433364867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,16,power_law_1.01,0.14090240001678467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,16,power_law_1.01,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,16,power_law_1.01,0.15892479419708253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,16,power_law_1.01,0.20848639011383058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,16,power_law_1.01,0.19496959447860718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,16,power_law_1.01,0.20439040660858154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,16,power_law_1.01,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,16,power_law_1.01,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,16,power_law_1.01,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,16,power_law_1.01,0.2684927940368652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,16,power_law_1.01,0.2987967967987061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,16,power_law_1.01,0.3573760032653809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,16,power_law_1.01,0.451584005355835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,16,power_law_1.01,0.6492159843444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,16,power_law_1.01,0.9736191749572753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,16,power_law_1.01,1.3760512351989747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,16,power_law_1.01,2.127462387084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,16,power_law_1.01,2.6245119094848635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,16,power_law_1.2,0.7583744049072265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,1,power_law_1.01,0.2189311981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,1,power_law_1.01,0.36249599456787107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,1,power_law_1.01,0.6674431800842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,1,power_law_1.01,1.3023232460021972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,1,power_law_1.01,1.944985580444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,1,power_law_1.01,2.696396827697754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,1,power_law_1.01,3.5936256408691407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,1,power_law_1.01,3.9254016876220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,1,power_law_1.01,3.9362560272216798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,1,power_law_1.01,4.252671813964843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,1,power_law_1.01,4.242841720581055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,1,power_law_1.01,4.465254211425782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,1,power_law_1.01,4.440678405761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,1,power_law_1.01,4.594073486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,1,power_law_1.01,4.688896179199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,1,power_law_1.01,4.8175102233886715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,1,power_law_1.01,4.875263977050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,1,power_law_1.01,5.109145736694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,1,power_law_1.01,5.286912155151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,1,power_law_1.01,5.493344116210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,1,power_law_1.01,5.774540710449219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,1,power_law_1.01,6.568550109863281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,1,power_law_1.01,7.2056831359863285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,1,power_law_1.01,8.804966735839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,1,power_law_1.01,10.338918304443359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,1,power_law_1.01,13.646015930175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,16,power_law_1.2,1.054310417175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,1,power_law_1.01,16.275660705566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,16,power_law_1.01,0.31600639820098875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,16,power_law_1.01,0.5464064121246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,16,power_law_1.01,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,16,power_law_1.01,0.4880191802978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,16,power_law_1.01,0.5031936168670654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,16,power_law_1.01,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,16,power_law_1.01,0.49111042022705076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,16,power_law_1.01,0.5271552085876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,16,power_law_1.01,0.4640768051147461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,16,power_law_1.01,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,16,power_law_1.01,0.4841152191162109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,16,power_law_1.01,0.5140416145324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,16,power_law_1.01,0.5093376159667968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,16,power_law_1.01,0.5465983867645263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,16,power_law_1.01,0.5543935775756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,16,power_law_1.01,0.5156864166259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,16,power_law_1.01,0.5855040073394775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,16,power_law_1.01,0.627507209777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,16,power_law_1.01,0.5998591899871826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,16,power_law_1.01,0.6948863983154296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,16,power_law_1.01,0.7440383911132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,16,power_law_1.01,0.9271103858947753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,16,power_law_1.01,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,16,power_law_1.01,1.1997183799743651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,16,power_law_1.01,0.2248703956604004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,16,power_law_1.01,0.21954560279846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,16,power_law_1.01,0.23900160789489747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,16,power_law_1.01,1.576140785217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,16,power_law_1.01,0.14315520524978637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,16,power_law_1.01,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,16,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,16,power_law_1.01,2.00314884185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,16,power_law_1.01,3.0425088882446287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,16,power_law_1.01,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,16,power_law_1.01,0.23879680633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,16,power_law_1.01,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,16,power_law_1.01,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,16,power_law_1.01,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,16,power_law_1.01,3.5086334228515623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,16,power_law_1.01,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,16,power_law_1.01,0.2619391918182373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,16,power_law_1.01,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,16,power_law_1.01,0.24821760654449462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,16,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,16,power_law_1.01,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,16,power_law_1.01,0.27647359371185304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,16,power_law_1.01,0.3737600088119507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,16,power_law_1.01,0.43233280181884765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,16,power_law_1.01,0.5285888195037842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,16,power_law_1.01,0.6467584133148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,16,power_law_1.01,1.2015616416931152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,16,power_law_1.01,1.656831932067871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,16,power_law_1.01,2.0850688934326174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,16,power_law_1.01,2.8444671630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,16,balanced,0.023381332556406658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,16,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,16,balanced,0.022170667846997578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,16,balanced,0.03735466549793879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,16,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,16,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,16,balanced,0.02438933402299881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,16,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,16,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,16,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,16,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,16,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,16,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,16,balanced,0.026778665681680042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,16,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,16,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,16,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,16,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,16,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,16,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,16,balanced,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,16,balanced,0.08277333279450734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,16,balanced,0.16554666558901468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,16,balanced,0.2476373314857483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,16,balanced,0.36556800206502277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,16,balanced,0.5138560136159261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,4,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,4,balanced,0.04469866553942362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,4,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,4,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,4,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,4,balanced,0.2959360082944234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,4,balanced,0.29815467198689777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,4,balanced,0.2935466567675273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,4,balanced,0.2961066762606303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,4,balanced,0.2986666758855184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,4,balanced,0.3031040032704671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,4,balanced,0.3102719982465108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,4,balanced,0.31522132953008014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,4,balanced,0.3217066725095113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,4,balanced,0.3338186740875244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,4,balanced,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,4,balanced,0.36164267857869464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,4,balanced,0.40396801630655926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,4,balanced,0.44049068291982013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,4,balanced,0.5090986490249634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,4,balanced,0.6145706574122111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,4,balanced,0.8277333577473959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,4,balanced,1.0530133247375488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,4,balanced,1.5706453323364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,4,balanced,2.175146738688151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,4,balanced,3.257685343424479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,4,balanced,4.333567937215169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,64,balanced,0.04214933514595032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,64,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,64,balanced,0.036346666514873505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,64,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,64,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,64,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,64,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,64,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,64,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,64,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,64,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,64,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,64,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,64,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,64,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,64,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,64,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,64,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,64,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,64,balanced,0.07509333391984303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,64,balanced,0.08959999680519104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,64,balanced,0.18705066045125326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,64,balanced,0.2553173303604126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,64,balanced,0.3438933293024699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,64,balanced,0.41369601090749103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,64,balanced,0.5838506619135538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,64,balanced,0.7709013621012369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,8,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,8,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,8,balanced,0.1397760013739268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,64,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,64,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,64,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,64,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,64,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,64,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,64,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,64,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,64,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,64,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,64,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,64,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,64,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,64,balanced,0.04743466774622599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,64,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,64,balanced,0.06229333579540253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,64,balanced,0.10001066327095032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,8,balanced,0.353770653406779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,8,balanced,0.6681546370188395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,8,balanced,1.2965546449025471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,8,balanced,1.3004480202992756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,8,balanced,1.3015039761861165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,8,balanced,1.3035519917805989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,8,balanced,1.3045653502146404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,64,balanced,0.09215999643007915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,64,balanced,0.2065066695213318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,8,balanced,1.310863971710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,64,balanced,0.27476267019907635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,8,balanced,1.315669298171997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,64,balanced,0.41369601090749103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,8,balanced,1.3190826574961345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,8,balanced,1.323520024617513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,64,balanced,0.4983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,8,balanced,1.336309274037679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,8,balanced,1.3450239499409993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,8,balanced,1.3619200388590496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,8,balanced,1.420789400736491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,8,balanced,1.4446934064229329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,8,balanced,1.4310399691263835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,8,balanced,1.491114616394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,8,balanced,1.5673920313517253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,8,balanced,1.6815786361694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,8,balanced,1.8597547213236492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,8,balanced,2.0706987380981445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,8,balanced,2.557781378428141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,8,balanced,3.294720013936361
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.10198400020599366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.2799616098403931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.451584005355835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.6047616004943848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.7344128131866455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,1,power_law_1.2,1.0078207969665527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,1,power_law_1.2,1.0612607955932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,1,power_law_1.2,1.1040767669677733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,1,power_law_1.2,1.202175998687744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,1,power_law_1.2,1.2199935913085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,1,power_law_1.2,1.3207551956176757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,1,power_law_1.2,1.386905574798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,1,power_law_1.2,1.4936063766479493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,1,power_law_1.2,1.5376383781433105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,1,power_law_1.2,1.6420799255371095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,1,power_law_1.2,1.8745344161987305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,1,power_law_1.2,2.1180416107177735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,1,power_law_1.2,2.5650815963745117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,1,power_law_1.2,3.034111976623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,1,power_law_1.2,3.9493633270263673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,1,power_law_1.2,4.918681716918945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,1,power_law_1.2,6.76147232055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,1,power_law_1.2,8.579891204833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,1,power_law_1.2,12.340614318847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,32,power_law_1.2,0.3311487913131714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,32,power_law_1.2,0.4306943893432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,32,power_law_1.2,0.4278143882751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,32,power_law_1.2,0.4286464214324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,1,power_law_1.2,16.03765106201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,32,power_law_1.2,0.4157440185546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,32,power_law_1.2,0.399564790725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,32,power_law_1.2,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,32,power_law_1.2,0.3907583951950073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,32,power_law_1.2,0.36659200191497804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,32,power_law_1.2,0.37354240417480467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,32,power_law_1.2,0.43130879402160643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,32,power_law_1.2,0.40284161567687987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,32,power_law_1.2,0.3880959987640381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,32,power_law_1.2,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,32,power_law_1.2,0.4429823875427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,32,power_law_1.2,0.4454400062561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,32,power_law_1.2,0.4388864040374756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,32,power_law_1.2,0.5122047901153565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,32,power_law_1.2,0.5369855880737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,32,power_law_1.2,0.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,32,power_law_1.2,0.6850560188293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,32,power_law_1.2,0.87838716506958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,32,power_law_1.2,1.135206413269043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,32,power_law_1.2,1.719500732421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,32,power_law_1.2,2.0969472885131837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,32,power_law_1.2,3.263488006591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,32,power_law_1.2,4.308172988891601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,1,power_law_1.2,0.34713599681854246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,1,power_law_1.2,0.5677055835723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,1,power_law_1.2,1.095475196838379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,1,power_law_1.2,1.5945599555969239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,1,power_law_1.2,2.3195648193359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,1,power_law_1.2,4.1023296356201175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,1,power_law_1.2,4.332134246826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,1,power_law_1.2,4.598579025268554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,1,power_law_1.2,4.843315124511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,1,power_law_1.2,5.0862079620361325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,1,power_law_1.2,5.10013427734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,1,power_law_1.2,5.216665649414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,1,power_law_1.2,5.210931015014649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,1,power_law_1.2,5.39728012084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,1,power_law_1.2,5.463654327392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,1,power_law_1.2,5.477580642700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,1,power_law_1.2,5.735219192504883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,1,power_law_1.2,5.953945541381836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,1,power_law_1.2,6.149529647827149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,1,power_law_1.2,6.659891510009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,1,power_law_1.2,7.477043151855469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,1,power_law_1.2,8.78182373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,1,power_law_1.2,9.766912078857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,1,power_law_1.2,12.635750579833985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,1,power_law_1.2,15.102156066894532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,1,power_law_1.2,20.393778991699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,1,power_law_1.2,25.836953735351564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,64,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,64,power_law_1.2,0.024352000653743745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,64,power_law_1.2,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,64,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,64,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,64,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,64,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,64,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,64,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,64,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,64,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,32,power_law_1.01,0.4104191780090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,64,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,64,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,32,power_law_1.01,0.37068800926208495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,64,power_law_1.2,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,64,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,32,power_law_1.01,0.3858432054519653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,64,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,32,power_law_1.01,0.37560319900512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,64,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,32,power_law_1.01,0.33607680797576905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,64,power_law_1.2,0.07207679748535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,64,power_law_1.2,0.08335360288619995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,32,power_law_1.01,0.3794944047927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,64,power_law_1.2,0.11487360000610351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,32,power_law_1.01,0.32624640464782717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,64,power_law_1.2,0.1994752049446106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,32,power_law_1.01,0.3841856002807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,32,power_law_1.01,0.37396481037139895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,64,power_law_1.2,0.35143680572509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,32,power_law_1.01,0.38727679252624514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,32,power_law_1.01,0.3758080005645752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,32,power_law_1.01,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,32,power_law_1.01,0.38543360233306884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,32,power_law_1.01,0.3901439905166626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,32,power_law_1.01,0.41021437644958497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,32,power_law_1.01,0.416153621673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,32,power_law_1.01,0.42229762077331545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,32,power_law_1.01,0.4745215892791748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,32,power_law_1.01,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,32,power_law_1.01,0.6436863899230957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,32,power_law_1.01,0.7333888053894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,32,power_law_1.01,1.072537612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,32,power_law_1.01,1.3402112007141114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,32,power_law_1.01,2.142617607116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,64,power_law_1.2,0.45465598106384275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,32,power_law_1.01,2.511667251586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,32,power_law_1.01,3.511705780029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,32,power_law_1.01,4.842700958251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,64,power_law_1.2,0.6772736072540283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,64,power_law_1.2,0.9861120223999024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,2,balanced,0.3160746693611145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,2,balanced,0.5433973471323649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,2,balanced,1.0304853121439617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,2,balanced,2.0147199630737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,2,balanced,4.088149388631185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,2,balanced,7.893327713012695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,2,balanced,0.5976746479670206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,2,balanced,1.0390186309814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,2,balanced,2.035711924235026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,2,balanced,11.813716888427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,2,balanced,4.112554550170898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,2,balanced,8.139605204264322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,2,balanced,11.832661946614584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,2,balanced,11.853642781575521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,2,balanced,15.92746607462565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,2,balanced,11.87276840209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,2,balanced,15.941632588704428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,2,balanced,11.90877914428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,2,balanced,15.959210713704428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,2,balanced,11.945098876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,2,balanced,15.965012868245443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,2,balanced,11.979775746663412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,2,balanced,12.037087758382162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,2,balanced,15.989930470784506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,2,balanced,12.09890111287435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,2,balanced,16.01092274983724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,2,balanced,12.150613149007162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,2,balanced,16.03430430094401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,2,balanced,12.255060831705729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,2,balanced,12.432042439778646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,2,balanced,16.07031504313151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,2,balanced,12.576597849527994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,2,balanced,16.11844253540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,2,balanced,12.86963144938151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,2,balanced,16.179882049560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,8,power_law_1.2,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,8,power_law_1.2,0.5242879867553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,2,balanced,13.169663747151693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,8,power_law_1.2,0.5709824085235595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,8,power_law_1.2,0.6582272052764893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,8,power_law_1.2,0.7802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,8,power_law_1.2,0.9285632133483886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,2,balanced,16.241322835286457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,8,power_law_1.2,0.9250816345214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,2,balanced,13.739008585611979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,8,power_law_1.2,0.8366080284118652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,8,power_law_1.2,0.8845312118530273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,8,power_law_1.2,0.9185279846191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,8,power_law_1.2,0.8775679588317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,8,power_law_1.2,0.9308159828186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,2,balanced,16.344404856363933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,8,power_law_1.2,0.9367551803588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,2,balanced,14.34436289469401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,8,power_law_1.2,1.0008576393127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,8,power_law_1.2,1.0221568107604981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,8,power_law_1.2,1.0364928245544434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,8,power_law_1.2,1.1216896057128907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,8,power_law_1.2,1.195417594909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,8,power_law_1.2,1.2003328323364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,2,balanced,17.090389251708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,2,balanced,15.452159881591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,8,power_law_1.2,1.3477888107299805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,8,power_law_1.2,1.5474687576293946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,8,power_law_1.2,1.9515392303466796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,8,power_law_1.2,2.2841344833374024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,2,balanced,17.428138732910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,2,balanced,16.035498301188152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,8,power_law_1.2,3.138355255126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,8,power_law_1.2,3.387392044067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,2,balanced,17.821343739827473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,2,balanced,18.70694351196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,8,power_law_1.2,4.982169723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,8,power_law_1.2,7.143424224853516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,2,balanced,18.492757161458332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,2,balanced,22.188886006673176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,2,balanced,21.59581756591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,2,balanced,24.769877115885418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,2,balanced,25.539072672526043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,1,power_law_1.2,1.1280384063720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,1,power_law_1.2,2.1942272186279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,1,power_law_1.2,4.308966445922851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,2,balanced,25.44708251953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,1,power_law_1.2,6.385254287719727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,1,power_law_1.2,8.968396759033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,2,balanced,28.810923258463543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,1,power_law_1.2,16.78970947265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,2,power_law_1.2,0.20684800148010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,1,power_law_1.2,17.714175415039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,2,power_law_1.2,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,2,power_law_1.2,0.4282368183135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,2,power_law_1.2,0.5318655967712402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,2,power_law_1.2,0.5048319816589355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,2,power_law_1.2,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,2,balanced,34.20091756184896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,2,power_law_1.2,0.5367807865142822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,2,power_law_1.2,0.540876817703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,2,power_law_1.2,0.5498879909515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,2,power_law_1.2,0.5619711875915527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,1,power_law_1.2,17.834393310546876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,2,power_law_1.2,0.5648384094238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,2,power_law_1.2,0.5943295955657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,2,power_law_1.2,0.5801983833312988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,2,power_law_1.2,0.6305791854858398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,2,power_law_1.2,0.6744063854217529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,1,power_law_1.2,19.293798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,2,power_law_1.2,0.719871997833252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,2,power_law_1.2,0.8163328170776367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,2,power_law_1.2,0.9447423934936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,1,power_law_1.2,18.67530212402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,2,power_law_1.2,1.176371192932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,1,power_law_1.2,19.737394714355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,2,power_law_1.2,1.503001594543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,1,power_law_1.2,20.855194091796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,2,power_law_1.2,1.923276710510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,1,power_law_1.2,20.604698181152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,1,power_law_1.2,22.024191284179686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,1,power_law_1.2,22.867762756347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,2,power_law_1.2,2.364825630187988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,1,power_law_1.2,23.212205505371095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,1,power_law_1.2,23.182949829101563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,1,power_law_1.2,24.29539794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,2,power_law_1.2,3.000320053100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,1,power_law_1.2,25.20657958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,8,power_law_1.01,0.03315199911594391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,8,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,8,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,8,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,8,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,8,power_law_1.01,0.04299519956111908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,8,power_law_1.01,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,8,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,8,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,8,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,8,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,8,power_law_1.01,0.07247359752655029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,8,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,8,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,8,power_law_1.01,0.10035200119018554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,1,power_law_1.2,26.988748168945314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,8,power_law_1.01,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,8,power_law_1.01,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,8,power_law_1.01,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,8,power_law_1.01,0.32889599800109864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,8,power_law_1.01,0.4419583797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,8,power_law_1.01,0.8259455680847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,8,power_law_1.01,1.1952128410339355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,2,power_law_1.2,4.662271881103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,8,power_law_1.01,1.7446912765502929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,8,power_law_1.01,2.1817344665527343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,1,power_law_1.2,33.561587524414065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,1,power_law_1.2,38.63572387695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,1,power_law_1.2,36.88652648925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,2,power_law_1.2,5.606399917602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,1,power_law_1.2,45.31773376464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,1,power_law_1.2,51.7865478515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,8,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,8,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,8,balanced,0.1728853384653727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,8,balanced,0.3537919918696086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,8,balanced,0.6830026308695475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,8,balanced,0.6864159901936849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,8,balanced,0.6746400197347006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,8,balanced,0.6763466993967692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,8,balanced,0.6773760318756104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,8,balanced,0.6807893117268881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,8,balanced,0.6847146352132162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,8,balanced,0.6867626508076986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,8,balanced,0.6930773258209229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,8,balanced,0.7017813523610433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,8,balanced,0.7069013118743896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,8,balanced,0.7178239822387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,8,balanced,0.7388160228729248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,8,balanced,0.7604906558990479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,1,power_law_1.2,69.54741821289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,8,balanced,0.8084479967753092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,8,balanced,0.8550399939219157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,8,balanced,0.9173333644866943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,8,balanced,0.9905493259429932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,8,balanced,1.1492693424224854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,8,balanced,1.3385334014892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,8,balanced,1.7582079569498699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,8,balanced,2.2638932863871255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,2,power_law_1.2,7.7305854797363285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,4,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,4,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,4,power_law_1.01,0.21012480258941652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,4,power_law_1.01,0.2570240020751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,4,power_law_1.01,0.3235840082168579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,4,power_law_1.01,0.342630410194397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,4,power_law_1.01,0.4601856231689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,4,power_law_1.01,0.4607999801635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,4,power_law_1.01,0.5062655925750732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,4,power_law_1.01,0.48660478591918943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,4,power_law_1.01,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,4,power_law_1.01,0.5068799972534179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,4,power_law_1.01,0.48906240463256834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,4,power_law_1.01,0.530841588973999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,4,power_law_1.01,0.5242815971374511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,4,power_law_1.01,0.5552000045776367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,4,power_law_1.01,0.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,4,power_law_1.01,0.6658048152923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,4,power_law_1.01,0.7237631797790527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,4,power_law_1.01,0.8435711860656738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,4,power_law_1.01,0.952729606628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,4,power_law_1.01,1.2376064300537108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,4,power_law_1.01,1.56692476272583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,4,power_law_1.01,2.144051170349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,4,power_law_1.01,2.6726400375366213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,4,power_law_1.01,3.945062255859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,4,power_law_1.01,5.3100543975830075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,1,power_law_1.2,86.4468994140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,2,power_law_1.2,12.53949432373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,1,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,1,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,1,power_law_1.01,0.3217407941818237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,1,power_law_1.01,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,1,power_law_1.01,0.9406463623046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,2,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,2,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,2,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,2,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,2,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,1,power_law_1.01,1.3123200416564942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,2,power_law_1.01,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,2,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,1,power_law_1.01,1.5462400436401367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,2,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,2,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,2,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,2,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,1,power_law_1.01,2.0224000930786135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,2,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,2,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,2,power_law_1.01,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,1,power_law_1.01,2.15467529296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,2,power_law_1.01,0.10444799661636353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,1,power_law_1.01,2.182758331298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,2,power_law_1.01,0.09932799935340882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,2,power_law_1.01,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,1,power_law_1.01,2.344140815734863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,2,power_law_1.01,0.2002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,1,power_law_1.01,2.4342527389526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,2,power_law_1.01,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,1,power_law_1.01,2.517401695251465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,1,power_law_1.01,2.571059226989746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,2,power_law_1.01,0.3127295970916748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,1,power_law_1.01,2.672025680541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,1,power_law_1.01,2.7994112014770507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,2,power_law_1.01,0.44748802185058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,1,power_law_1.01,2.8827648162841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,1,power_law_1.01,3.160063934326172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,1,power_law_1.01,3.275980758666992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,1,power_law_1.01,3.7611457824707033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,1,power_law_1.01,4.122828674316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,2,power_law_1.01,0.6334335803985596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,1,power_law_1.01,4.94653434753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,1,power_law_1.01,5.575270462036133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,1,power_law_1.01,7.115366363525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,2,power_law_1.01,0.9095168113708496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,1,power_law_1.01,8.662016296386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,1,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,1,power_law_1.2,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,2,power_law_1.01,1.7133567810058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,1,power_law_1.2,0.36249599456787107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,1,power_law_1.2,0.5687295913696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,1,power_law_1.2,0.7872511863708496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,1,power_law_1.2,1.426022434234619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,1,power_law_1.2,1.532313632965088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,1,power_law_1.01,11.95315170288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,1,power_law_1.2,1.590067195892334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,1,power_law_1.2,1.6623615264892577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,1,power_law_1.2,1.6857088088989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,1,power_law_1.2,1.700864028930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,1,power_law_1.2,1.7692672729492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,1,power_law_1.2,1.8042879104614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,1,power_law_1.2,1.884979248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,1,power_law_1.01,14.695014953613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,1,power_law_1.2,1.8724863052368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,1,power_law_1.2,1.9013631820678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,1,power_law_1.2,1.9752960205078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,1,power_law_1.2,2.0191232681274416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,1,power_law_1.2,2.105958366394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,1,power_law_1.2,2.3597055435180665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,1,power_law_1.2,2.5589759826660154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,1,power_law_1.2,3.0818304061889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,1,power_law_1.2,3.2931838989257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,1,power_law_1.2,4.103577423095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,1,power_law_1.2,4.908236694335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,1,power_law_1.2,6.729523468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,1,power_law_1.2,8.35072021484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,2,power_law_1.01,1.740595245361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,2,power_law_1.01,3.017523193359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.2840192079544067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.5361663818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.8249343872070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,1,power_law_1.2,1.175334358215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,1,power_law_1.2,1.408614444732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,1,power_law_1.2,2.0010623931884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,1,power_law_1.2,2.1176319122314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,1,power_law_1.2,2.1583871841430664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,1,power_law_1.2,2.2597631454467773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,1,power_law_1.2,2.3588863372802735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,2,power_law_1.01,4.169113540649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,1,power_law_1.2,2.4432640075683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,1,power_law_1.2,2.6015743255615233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,1,power_law_1.2,2.7222015380859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,1,power_law_1.2,2.8460927963256837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,1,power_law_1.2,3.0091264724731444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,1,power_law_1.2,3.2661182403564455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,1,power_law_1.2,3.549388885498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,1,power_law_1.2,4.009164810180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,1,power_law_1.2,4.546150588989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,1,power_law_1.2,5.574617767333985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,1,power_law_1.2,6.4753662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,1,power_law_1.2,8.425676727294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,1,power_law_1.2,10.27768325805664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,1,power_law_1.2,14.255500793457031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,1,power_law_1.2,18.084249877929686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,1,balanced,0.06570133566856384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,1,balanced,0.07133866846561432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,1,balanced,0.09181867043177287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,1,balanced,0.2839733362197876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,1,balanced,0.537770668665568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,1,balanced,1.0379947026570637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,1,balanced,1.534122625986735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,1,balanced,1.5322453180948894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,1,balanced,1.5491414070129395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,1,balanced,1.561087926228841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,1,balanced,1.5817386309305828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,1,balanced,1.608191967010498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,1,balanced,1.6252586046854656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,1,balanced,1.6733867327372234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,1,balanced,1.7170772552490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,1,balanced,1.7624746958414714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,1,balanced,1.8520746231079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,1,balanced,2.0560213724772134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,1,balanced,2.29802672068278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,1,balanced,2.7071145375569663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,1,balanced,3.1378774642944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,1,balanced,4.067328135172526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,1,balanced,5.029888153076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,1,balanced,6.896810531616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,1,balanced,8.63761075337728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,1,balanced,12.477099100748697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,1,balanced,15.997269948323568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,4,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,4,power_law_1.2,0.10055680274963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,4,power_law_1.2,0.1439743995666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,4,power_law_1.2,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,4,power_law_1.2,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,4,power_law_1.2,0.38828799724578855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,4,power_law_1.2,0.429260778427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,4,power_law_1.2,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,4,power_law_1.2,0.450764799118042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,4,power_law_1.2,0.440934419631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,4,power_law_1.2,0.45854721069335935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,4,power_law_1.2,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,4,power_law_1.2,0.4976640224456787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,4,power_law_1.2,0.4689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,4,power_law_1.2,0.48578557968139646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,4,power_law_1.2,0.5130239963531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,4,power_law_1.2,0.5066751956939697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,4,power_law_1.2,0.5478400230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,4,power_law_1.2,0.5853184223175049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,4,power_law_1.2,0.6344575881958008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,4,power_law_1.2,0.7383039951324463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,4,power_law_1.2,0.9435135841369628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,4,power_law_1.2,0.9830400466918945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,4,power_law_1.2,1.3012991905212403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,4,power_law_1.2,1.6994304656982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,4,power_law_1.2,2.4166400909423826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,8,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,8,balanced,0.2860373258590698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,8,balanced,0.4720319906870524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,8,balanced,0.9316533406575521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,8,balanced,1.5757652918497722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,8,balanced,2.089130719502767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,8,balanced,2.0991946856180825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,8,balanced,2.097322622934977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,8,balanced,2.100565274556478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,8,balanced,2.10534397761027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,4,power_law_1.2,3.100057601928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,8,balanced,2.1142187118530273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,8,balanced,2.1261653900146484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,8,balanced,2.1317973136901855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,8,balanced,2.1531306902567544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,8,balanced,2.1678080558776855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,8,balanced,2.184021313985189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,8,balanced,2.213205337524414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,8,balanced,2.25655460357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,8,balanced,2.2990506490071616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,8,balanced,2.3683412869771323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,8,balanced,2.4739839235941568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,8,balanced,2.7076266606648765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,8,balanced,2.910037358601888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,8,balanced,3.432618776957194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,8,balanced,3.994112014770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,8,balanced,5.508778889973958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,8,balanced,6.885866800944011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,4,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,4,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,4,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,4,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,4,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,4,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,4,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,4,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,4,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,4,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,4,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,4,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,4,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,4,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,4,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,4,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,4,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,8,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,4,power_law_1.01,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,8,balanced,0.5572266578674316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,8,balanced,0.8792746861775717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,4,power_law_1.01,0.11997439861297607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,8,balanced,1.7955840428670247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,8,balanced,3.0999892552693686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,4,power_law_1.01,0.15872000455856322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,8,balanced,4.208469390869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,8,balanced,4.205909411112468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,8,balanced,4.094805399576823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,4,power_law_1.01,0.1763327956199646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,8,balanced,4.101632118225098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,8,balanced,4.111530621846517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,8,balanced,4.118186632792155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,4,power_law_1.01,0.24309759140014647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,8,balanced,4.134229342142741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,8,balanced,4.148223876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,4,power_law_1.01,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,8,balanced,4.168021202087402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,8,balanced,4.192938804626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,8,balanced,4.211541175842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,8,balanced,4.245845476786296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,8,balanced,4.439551989237468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,8,balanced,4.602026621500651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,8,balanced,4.532224019368489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,8,balanced,4.506112098693848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,8,balanced,4.823040008544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,4,power_law_1.01,0.6014976024627685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,8,balanced,5.0775041580200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,8,balanced,5.7910614013671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,8,balanced,6.401365280151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,8,balanced,8.486741383870443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,8,balanced,10.305194854736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,4,power_law_1.01,0.9502400398254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,2,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,2,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,2,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,2,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,2,power_law_1.2,0.11407359838485717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,2,power_law_1.2,0.17776639461517335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,2,power_law_1.2,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,2,power_law_1.2,0.2883584022521973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,2,power_law_1.2,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,2,power_law_1.2,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,2,power_law_1.2,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,2,power_law_1.2,0.32133119106292723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,2,power_law_1.2,0.3352576017379761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,2,power_law_1.2,0.34140160083770754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,2,power_law_1.2,0.35614719390869143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,2,power_law_1.2,0.3663872003555298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,2,power_law_1.2,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,4,power_law_1.01,1.5104000091552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,2,power_law_1.2,0.43479042053222655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,2,power_law_1.2,0.4759552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,2,power_law_1.2,0.5666816234588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,2,power_law_1.2,0.66211838722229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,2,power_law_1.2,0.8708095550537109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,2,power_law_1.2,1.142784023284912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,2,power_law_1.2,1.6699264526367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,2,power_law_1.2,2.063360023498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,2,power_law_1.2,3.1309823989868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,2,power_law_1.2,4.206796646118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,1,balanced,0.30617600679397583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,1,balanced,0.5309439897537231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,1,balanced,1.0359466870625813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,1,balanced,1.0367999871571858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,1,balanced,1.0347519715627034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,1,balanced,1.0395306746164958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,1,balanced,1.049770673116048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,1,balanced,1.0617173512776692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,1,balanced,1.075541337331136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,1,balanced,1.0806612968444824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,1,balanced,1.0873013337453206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,1,balanced,1.1011412938435872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,1,balanced,1.1079413096110027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,1,balanced,1.2177066802978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,1,balanced,1.1579733689626057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,1,balanced,1.209173361460368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,1,balanced,1.3042346636454265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,1,balanced,1.3422932624816895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,1,balanced,1.4646612803141277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,1,balanced,1.8280107180277507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,1,balanced,2.2374399503072104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,1,balanced,3.1585280100504556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,1,balanced,4.064426740010579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,1,balanced,5.894655863444011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,1,balanced,7.386624018351237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,1,balanced,10.938196818033854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,1,balanced,14.366549173990885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,4,power_law_1.01,2.3260992050170897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,16,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,16,balanced,0.06519466638565063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,16,balanced,0.29576534032821655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,16,balanced,0.5474986632664999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,16,balanced,0.9055573145548502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,16,balanced,1.055573304494222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,16,balanced,1.0587999820709229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,16,balanced,1.0518186887105305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,16,balanced,1.0547200043996174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,16,balanced,1.056938648223877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,16,balanced,1.0618879795074463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,16,balanced,1.0678613185882568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,16,balanced,1.0743146737416585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,16,balanced,1.0825386842091878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,16,balanced,1.0927786827087402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,16,balanced,1.1025066375732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,16,balanced,1.1221333344777424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,16,balanced,1.1661653518676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,16,balanced,1.1979093551635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,16,balanced,1.2545706431070964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,16,balanced,1.3192533651987712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,16,balanced,1.446741263071696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,16,balanced,1.5721813837687175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,16,balanced,2.0838400522867837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,16,balanced,2.3705600102742515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,16,balanced,3.4088961283365884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,16,balanced,4.137301445007324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,2,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,2,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,2,power_law_1.2,0.1019711971282959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,2,power_law_1.2,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,2,power_law_1.2,0.25559039115905763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,2,power_law_1.2,0.3932159900665283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,2,power_law_1.2,0.4200448036193848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,2,power_law_1.2,0.43868160247802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,2,power_law_1.2,0.4515711784362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,2,power_law_1.2,0.44810237884521487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,2,power_law_1.2,0.42557439804077146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,2,power_law_1.2,0.45281281471252444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,2,power_law_1.2,0.454041576385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,2,power_law_1.2,0.4759552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,2,power_law_1.2,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,2,power_law_1.2,0.502784013748169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,2,power_law_1.2,0.510975980758667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,2,power_law_1.2,0.5435391902923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,2,power_law_1.2,0.5521408081054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,2,power_law_1.2,0.6825984001159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,2,power_law_1.2,0.7227392196655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,2,power_law_1.2,0.9660415649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,2,power_law_1.2,1.1692031860351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,2,power_law_1.2,1.6920576095581055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,2,power_law_1.2,1.882521629333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,2,power_law_1.2,2.548736000061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,128,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,128,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,128,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,128,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,128,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,128,balanced,0.031557333966096245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,128,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,128,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,128,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,128,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,128,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,128,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,128,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,128,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,128,balanced,0.03514666606982549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,128,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,128,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,128,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,128,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,128,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,128,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,128,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,128,balanced,0.07970133423805237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,128,balanced,0.10513066252072652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,128,balanced,0.19029333194096884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,128,balanced,0.2930346727371216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,2,power_law_1.2,3.886067199707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,16,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,16,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,16,balanced,0.2955946723620097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,16,balanced,0.5480106671651205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,16,balanced,0.5504000186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,16,balanced,0.5546666781107584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,16,balanced,0.5577386617660522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,16,balanced,0.5584213336308798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,16,balanced,0.5531306664148966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,16,balanced,0.5570559899012247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,16,balanced,0.5608106851577759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,16,balanced,0.5664426485697428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,16,balanced,0.5758293469746908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,16,balanced,0.5831679900487264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,16,balanced,0.59716268380483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,16,balanced,0.624127984046936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,16,balanced,0.6562133232752482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,16,balanced,0.7085973421732584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,16,balanced,0.7565653324127197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,16,balanced,0.8338773250579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,2,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,16,balanced,0.9388373692830404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,2,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,16,balanced,1.1975680192311604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,2,power_law_1.01,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,16,balanced,1.5184213320414226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,2,power_law_1.01,0.35201919078826904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,2,power_law_1.01,0.6170623779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,16,balanced,2.101077397664388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,2,power_law_1.01,0.7636991977691651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,16,balanced,2.677077293395996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,2,power_law_1.01,0.9160703659057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,2,power_law_1.01,1.1063296318054199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,2,power_law_1.01,1.1552767753601074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,2,power_law_1.01,1.1618304252624512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,2,power_law_1.01,1.2525247573852538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,2,power_law_1.01,1.2376064300537108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,2,power_law_1.01,1.2926976203918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,2,power_law_1.01,1.308672046661377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,2,power_law_1.01,1.4446592330932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,2,power_law_1.01,1.4485247611999512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,2,power_law_1.01,1.5747072219848632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,2,power_law_1.01,1.6478208541870116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,2,power_law_1.01,1.7719295501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,2,power_law_1.01,2.043903923034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,2,power_law_1.01,2.3615488052368163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,2,power_law_1.01,2.8702720642089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,2,power_law_1.01,3.309977722167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,2,power_law_1.01,4.421836853027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,2,power_law_1.01,5.613977432250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,2,power_law_1.01,7.728121948242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,2,power_law_1.01,9.662854766845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,2,power_law_1.01,0.6152192115783691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,2,power_law_1.01,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,2,power_law_1.01,1.6136192321777343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,2,power_law_1.01,2.7219839096069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,2,power_law_1.01,3.8799358367919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,2,power_law_1.01,4.6229503631591795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,2,power_law_1.01,6.442393493652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,2,power_law_1.01,6.1962238311767575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,2,power_law_1.01,6.463897705078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,2,power_law_1.01,6.765145874023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,2,power_law_1.01,6.88885726928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,2,power_law_1.01,6.817791748046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,2,power_law_1.01,7.016435241699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,2,power_law_1.01,7.085056304931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,2,power_law_1.01,7.399014282226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,2,power_law_1.01,7.482777404785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,2,power_law_1.01,7.802265930175781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,2,power_law_1.01,8.011980438232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,2,power_law_1.01,8.633344268798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,32,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,32,power_law_1.2,0.037241598963737486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,32,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,32,power_law_1.2,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,2,power_law_1.01,9.012633514404296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,32,power_law_1.2,0.036236798763275145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,32,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,32,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,32,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,32,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,32,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,32,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,32,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,32,power_law_1.2,0.04094719886779785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,2,power_law_1.01,9.546137237548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,32,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,32,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,8,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,32,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,8,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,8,balanced,0.06451199948787689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,8,balanced,0.30498133103052777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,32,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,8,balanced,0.5795573393503824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,32,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,8,balanced,0.7046826680501302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,8,balanced,0.7082666556040446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,32,power_law_1.2,0.07720959782600403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,8,balanced,0.7111679712931315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,32,power_law_1.2,0.09789440035820007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,8,balanced,0.7135573228200277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,8,balanced,0.7156053384145101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,32,power_law_1.2,0.11653120517730713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,8,balanced,0.7202133337656657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,8,balanced,0.7241386572519938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,32,power_law_1.2,0.18532480001449586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,8,balanced,0.7289173603057861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,2,power_law_1.01,10.588365173339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,8,balanced,0.7374506791432699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,32,power_law_1.2,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,8,balanced,0.746666669845581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,8,balanced,0.7567359606424967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,32,power_law_1.2,0.42086400985717776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,8,balanced,0.7719253698984782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,8,balanced,0.802133321762085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,32,power_law_1.2,0.521830415725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,8,balanced,0.8366080125172933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,8,balanced,0.8852266470591227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,8,balanced,0.9425653616587321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,32,power_law_1.2,0.881049633026123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,8,balanced,1.0567680199940999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,8,balanced,1.2100266615549724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,32,power_law_1.2,1.1464703559875489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,2,power_law_1.01,11.887615966796876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,8,balanced,1.559893290201823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,8,balanced,1.9737599690755208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,8,balanced,2.8796586990356445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,8,balanced,3.7459627787272134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,2,power_law_1.01,14.90882568359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,2,power_law_1.01,15.578726196289063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,2,power_law_1.01,20.811366271972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,2,power_law_1.01,25.140223693847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,4,power_law_1.2,0.08048639893531799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,4,power_law_1.2,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,4,power_law_1.2,0.19804160594940184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,4,power_law_1.2,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,4,power_law_1.2,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,4,power_law_1.2,0.24637439250946044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,4,power_law_1.2,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,4,power_law_1.2,0.25722880363464357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,4,power_law_1.2,0.2553855895996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,4,power_law_1.2,0.25620479583740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,4,power_law_1.2,0.26808319091796873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,4,power_law_1.2,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,4,power_law_1.2,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,4,power_law_1.2,0.3264512062072754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,4,power_law_1.2,0.3370879888534546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,4,power_law_1.2,0.34713599681854246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,4,power_law_1.2,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,4,power_law_1.2,0.49356799125671386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,4,power_law_1.2,0.6336512088775634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,4,power_law_1.2,0.8650752067565918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,4,power_law_1.2,1.0940223693847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,4,power_law_1.2,1.6445440292358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,8,balanced,0.2986666758855184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,8,balanced,0.2845013340314229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,8,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,8,balanced,0.2785173257191976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,8,balanced,0.27953600883483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,8,balanced,0.28040534257888794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,8,balanced,0.28228267033894855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,8,balanced,0.2836479942003886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,8,balanced,0.2850133379300435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,8,balanced,0.2863786617914836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,8,balanced,0.29815467198689777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,8,balanced,0.359935998916626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,8,balanced,0.36317865053812665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,8,balanced,0.2998613317807515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,8,balanced,0.3781973520914714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,8,balanced,0.3843413194020589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,8,balanced,0.3408213456471761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,8,balanced,0.44407467047373456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,8,balanced,0.457045316696167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,8,balanced,0.6420480012893677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,8,balanced,0.799402634302775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,8,balanced,1.1663359800974529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,8,balanced,1.4672212600708008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,8,balanced,2.0392746925354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,8,balanced,2.6212639808654785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,8,balanced,3.7114880879720054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,8,balanced,4.844031969706218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,4,power_law_1.2,1.9458047866821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,4,power_law_1.2,2.8000255584716798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,4,power_law_1.2,4.181196975708008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,4,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,4,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,4,power_law_1.01,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,4,power_law_1.01,0.15912959575653077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,4,power_law_1.01,0.21729280948638915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,4,power_law_1.01,0.3299328088760376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,4,power_law_1.01,0.3596287965774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,4,power_law_1.01,0.35287039279937743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,4,power_law_1.01,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,4,power_law_1.01,0.36659200191497804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,4,power_law_1.01,0.364134407043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,4,power_law_1.01,0.3868544101715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,4,power_law_1.01,0.4009984016418457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,4,power_law_1.01,0.41308159828186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,4,power_law_1.01,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,4,power_law_1.01,0.44851198196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,4,power_law_1.01,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,4,power_law_1.01,0.5158912181854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,4,power_law_1.01,0.5464064121246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,4,power_law_1.01,0.6365183830261231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,4,power_law_1.01,0.7935999870300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,4,power_law_1.01,1.0821632385253905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,4,power_law_1.01,1.3320192337036132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,4,power_law_1.01,2.0088832855224608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,4,power_law_1.01,2.6802175521850584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,4,power_law_1.01,3.6284416198730467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,4,power_law_1.01,5.117747116088867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,2,balanced,0.34986666838328045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,2,balanced,0.5879466533660889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,2,balanced,1.1127253373463948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,2,balanced,2.177194595336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,2,balanced,4.322618802388509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,2,balanced,5.375146865844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,2,balanced,5.387264251708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,2,balanced,5.400405248006185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,2,balanced,5.411669413248698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,2,balanced,5.419178644816081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,2,balanced,5.439317067464192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,2,balanced,5.464234670003255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,2,balanced,5.495808283487956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,2,balanced,5.548714955647786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,2,balanced,5.59172248840332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,2,balanced,5.793962478637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,2,balanced,5.867690404256185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,2,balanced,6.003706614176433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,2,balanced,6.110720316569011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,2,balanced,6.989125569661458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,2,balanced,6.438229242960612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,2,balanced,6.894250869750977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,2,balanced,7.4434560139973955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,2,balanced,8.81885846455892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,2,balanced,11.949055989583334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,4,power_law_1.2,6.4716796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,2,balanced,15.071573893229166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,2,balanced,20.034027099609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,4,power_law_1.2,7.049420928955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,4,balanced,0.5253119866053263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,4,balanced,0.5259946584701538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,4,balanced,1.0304853121439617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,4,balanced,1.0374826590220134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,4,balanced,1.0333759784698486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,4,balanced,1.0376533667246501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,4,balanced,1.0516479810078938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,4,balanced,1.0603520075480144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,4,balanced,1.0738240083058674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,4,balanced,1.0777599811553955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,4,balanced,1.0832213560740154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,4,balanced,1.0934613545735676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,4,balanced,1.1001173655192058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,4,balanced,1.1144533157348633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,4,balanced,1.751039981842041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,4,balanced,1.7972906430562336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,4,balanced,1.8399465878804524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,4,balanced,2.5553919474283853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,4,balanced,3.2320852279663086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,4,balanced,4.675242741902669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,32,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,4,balanced,5.612373352050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,32,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,32,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,32,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,32,balanced,0.2402986685434977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,32,balanced,0.24182933568954468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,32,balanced,0.24318399031956991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,32,balanced,0.24352532625198364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,32,balanced,0.244053324063619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,32,balanced,0.244053324063619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,32,balanced,0.24641066789627075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,32,balanced,0.2476373314857483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,32,balanced,0.2500266631444295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,32,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,32,balanced,0.25651200612386066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,32,balanced,0.258730669816335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,4,balanced,7.643637339274089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,32,balanced,0.2645333409309387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,32,balanced,0.27321600914001465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,32,balanced,0.27613866329193115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,32,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,32,balanced,0.30429333448410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,32,balanced,0.3667626778284709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,32,balanced,0.37085866928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,32,balanced,0.49561599890391034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,32,balanced,0.5893119970957438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,4,balanced,9.290239969889322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,32,balanced,0.9357653458913168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,32,balanced,1.2047253449757893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,4,balanced,11.68384043375651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,4,balanced,14.100650787353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,4,balanced,18.412885030110676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,64,power_law_1.2,0.46489601135253905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,64,power_law_1.2,0.41205759048461915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,64,power_law_1.2,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,64,power_law_1.2,0.416153621673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,64,power_law_1.2,0.36863999366760253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,64,power_law_1.2,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,4,balanced,22.228480021158855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,64,power_law_1.2,0.3141632080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,64,power_law_1.2,0.41246719360351564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,64,power_law_1.2,0.3768255949020386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,64,power_law_1.2,0.3655679941177368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,64,power_law_1.2,0.4214784145355225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,64,power_law_1.2,0.3895296096801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,64,power_law_1.2,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,64,power_law_1.2,0.373145604133606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,64,power_law_1.2,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,8,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,8,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,8,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,64,power_law_1.2,0.4374527931213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,8,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,8,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,64,power_law_1.2,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,8,power_law_1.2,0.05242239832878113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,8,power_law_1.2,0.06695680022239685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,64,power_law_1.2,0.481279993057251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,8,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,64,power_law_1.2,0.5261312007904053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,8,power_law_1.2,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,8,power_law_1.2,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,64,power_law_1.2,0.6512320041656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,64,power_law_1.2,0.7237631797790527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,8,power_law_1.2,0.1087488055229187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,64,power_law_1.2,1.0270719528198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,8,power_law_1.2,0.1558527946472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,64,power_law_1.2,1.104691219329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,8,power_law_1.2,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,64,power_law_1.2,1.6445440292358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,64,power_law_1.2,2.2163455963134764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,64,power_law_1.2,3.570073699951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,8,power_law_1.2,0.26398720741271975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,64,power_law_1.2,4.71203842163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,8,power_law_1.2,0.3868607997894287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,8,power_law_1.2,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,8,power_law_1.2,0.7993343830108642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,8,power_law_1.2,1.056768035888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,8,power_law_1.2,1.7047552108764648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,8,power_law_1.2,2.3771135330200197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,1,power_law_1.2,0.445849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,1,power_law_1.2,0.735641622543335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,1,power_law_1.2,1.4233599662780763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,1,power_law_1.2,2.3099391937255858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,1,power_law_1.2,3.0685184478759764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,1,power_law_1.2,5.949631881713867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,1,power_law_1.2,6.422732543945313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,1,power_law_1.2,6.612582397460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,8,power_law_1.2,3.2555007934570312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,1,power_law_1.2,6.848307037353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,1,power_law_1.2,7.085453033447266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,1,power_law_1.2,7.308287811279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,1,power_law_1.2,7.547084808349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,1,power_law_1.2,7.719731140136719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,1,power_law_1.2,7.999488067626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,1,power_law_1.2,8.239718627929687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,1,power_law_1.2,8.272486114501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,1,power_law_1.2,8.551219177246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,1,power_law_1.2,9.137356567382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,1,power_law_1.2,9.56701431274414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,1,power_law_1.2,10.325196838378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,1,power_law_1.2,11.270758056640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,1,power_law_1.2,13.392486572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,2,power_law_1.2,0.3172352075576782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,2,power_law_1.2,0.5468160152435303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,2,power_law_1.2,0.8638463973999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,2,power_law_1.2,1.397760009765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,2,power_law_1.2,2.145075225830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,1,power_law_1.2,14.52359619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,2,power_law_1.2,2.7023359298706056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,2,power_law_1.2,3.292979049682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,2,power_law_1.2,4.290560150146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,1,power_law_1.2,18.335743713378907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,2,power_law_1.2,4.328448104858398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,2,power_law_1.2,4.315955352783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,2,power_law_1.2,4.26063346862793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,2,power_law_1.2,4.376166534423828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,2,power_law_1.2,4.629299163818359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,2,power_law_1.2,4.934656143188477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,2,power_law_1.2,5.06879997253418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,1,power_law_1.2,21.312921142578126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,2,power_law_1.2,5.299609756469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,2,power_law_1.2,5.412863922119141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,2,power_law_1.2,5.81712646484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,2,power_law_1.2,6.08460807800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,1,power_law_1.2,29.62104187011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,2,power_law_1.2,6.613606262207031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,2,power_law_1.2,6.9478401184082035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,2,power_law_1.2,7.81107177734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,2,power_law_1.2,8.491622161865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,2,power_law_1.2,10.813215637207032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,8,power_law_1.2,4.851712036132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,1,power_law_1.2,37.41552734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,2,power_law_1.2,12.828877258300782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,2,power_law_1.2,16.36249542236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,2,power_law_1.2,17.49381103515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,1,power_law_1.01,0.1931264042854309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,1,power_law_1.01,0.37068800926208495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,1,power_law_1.01,0.7096320152282715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,1,power_law_1.01,1.1782079696655274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,1,power_law_1.01,1.702092742919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,1,power_law_1.01,2.8305408477783205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.6072319984436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,1,power_law_1.01,3.0523391723632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,1,power_law_1.2,1.1134976387023925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,1,power_law_1.01,3.216793441772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,1,power_law_1.2,2.185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,1,power_law_1.01,3.203891372680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,1,power_law_1.2,3.3556480407714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,1,power_law_1.01,3.2800769805908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,1,power_law_1.2,4.4994560241699215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,1,power_law_1.01,3.354828643798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,1,power_law_1.01,3.36732177734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,1,power_law_1.2,8.486093139648437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,1,power_law_1.01,3.480985641479492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,1,power_law_1.01,3.59997444152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,1,power_law_1.01,3.644192123413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,1,power_law_1.2,8.608358764648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,1,power_law_1.01,3.703398513793945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,1,power_law_1.01,3.8160385131835937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,1,power_law_1.2,8.961638641357421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,1,power_law_1.01,3.8483966827392577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,1,power_law_1.2,9.602047729492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,1,power_law_1.01,3.9118846893310546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,1,power_law_1.01,4.218227386474609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,1,power_law_1.2,9.567231750488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,1,power_law_1.01,4.629299163818359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,1,power_law_1.01,5.365964889526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,1,power_law_1.2,10.090496063232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,1,power_law_1.01,5.439692687988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,1,power_law_1.2,10.107891082763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,1,power_law_1.01,6.692454528808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,1,power_law_1.01,7.5499519348144535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,1,power_law_1.2,10.349158477783202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,1,power_law_1.01,10.421644592285157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,1,power_law_1.2,10.958643341064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,1,power_law_1.2,11.444019317626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,1,power_law_1.01,12.934349060058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,128,balanced,0.045893331368764244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,128,balanced,0.06997333467006683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,128,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,128,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,128,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,128,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,128,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,128,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,128,balanced,0.056645333766937256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,128,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,128,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,128,balanced,0.0759200006723404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,128,balanced,0.07987200220425923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,128,balanced,0.08584533135096233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,128,balanced,0.08258666594823201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,128,balanced,0.09352533022562663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,128,balanced,0.16742400328318277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,128,balanced,0.21466666460037231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,128,balanced,0.26026666164398193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,1,power_law_1.2,11.433574676513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,128,balanced,0.28706133365631104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,128,balanced,0.3826346794764201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,128,balanced,0.4225706656773885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,128,balanced,0.5292160113652548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,128,balanced,0.6164373159408569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,128,balanced,0.8934400081634521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,1,power_law_1.2,11.824537658691407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,128,balanced,1.1581439971923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,1,power_law_1.2,12.164710235595702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,1,power_law_1.2,12.76231689453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,1,power_law_1.2,13.560012817382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,1,power_law_1.2,15.649996948242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,1,power_law_1.2,18.75169219970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,1,power_law_1.2,18.32366027832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,1,power_law_1.2,22.795878601074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,1,power_law_1.2,27.160369873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,1,power_law_1.2,36.631143188476564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,32,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,32,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,32,balanced,0.1532586713631948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,32,balanced,0.40345601240793866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,32,balanced,0.5654186805089315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,32,balanced,0.5504000186920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,32,balanced,0.5522773265838623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,32,balanced,0.5591040054957072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,32,balanced,0.5604693492253622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,32,balanced,0.5613226493199667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,32,balanced,0.5553493499755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,32,balanced,0.5597866773605347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,32,balanced,0.562175989151001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,32,balanced,0.5671253204345703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,32,balanced,0.5746346712112427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,32,balanced,0.5797546704610189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,32,balanced,0.5920426845550537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,32,balanced,0.615066647529602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,32,balanced,0.637440005938212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,32,balanced,0.6790826320648193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,32,balanced,0.7236266930898031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,32,balanced,0.8275626500447592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,32,balanced,0.9301333427429199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,32,balanced,1.121280034383138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,32,balanced,1.3445119857788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,32,balanced,1.9025920232137044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,32,balanced,2.387114683787028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,1,power_law_1.2,46.20533752441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,2,balanced,0.3433813254038493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,2,balanced,0.5748053391774496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,2,balanced,1.0987520217895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,2,balanced,2.174448013305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,2,balanced,4.3378346761067705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,2,balanced,5.469184239705403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,2,balanced,5.485738754272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,2,balanced,5.343221028645833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,2,balanced,5.356885274251302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,2,balanced,5.370864232381185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,2,balanced,5.3998667399088545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,2,balanced,5.424981435139974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,2,balanced,5.448703765869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,2,balanced,5.493930816650391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,2,balanced,5.535061518351237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,2,balanced,5.576351801554362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,2,balanced,5.642581303914388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,2,balanced,5.794645309448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,2,balanced,5.968213399251302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,2,balanced,6.496085484822591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,2,balanced,6.439568201700847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,2,balanced,6.91490109761556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,2,balanced,7.348565419514974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,2,balanced,9.009493509928385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,2,balanced,10.82589848836263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,2,balanced,15.69382349650065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,2,balanced,19.643904368082683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,4,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,4,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,4,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,4,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,4,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,4,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,4,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,4,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,4,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,4,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,4,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,4,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,4,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,4,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,4,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,4,balanced,0.06229333579540253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,4,balanced,0.06894933183987935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,4,balanced,0.15940266847610474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,4,balanced,0.2310826579729716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,4,balanced,0.32477867603302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,4,balanced,0.4580693244934082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,4,balanced,0.8181760311126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,4,balanced,1.164629300435384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,4,balanced,1.876479943593343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,4,balanced,2.536106745402018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,8,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,8,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,8,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,8,power_law_1.01,0.03704319894313812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,8,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,8,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,8,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,8,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,8,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,8,power_law_1.01,0.050169599056243894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,8,power_law_1.01,0.05774719715118408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,8,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,8,power_law_1.01,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,8,power_law_1.01,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,8,power_law_1.01,0.10178560018539429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,8,power_law_1.01,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,8,power_law_1.01,0.14274560213088988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,8,power_law_1.01,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,8,power_law_1.01,0.21848320960998535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,8,power_law_1.01,0.315391993522644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,8,power_law_1.01,0.48291840553283694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,8,power_law_1.01,0.7473087787628174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,8,power_law_1.01,0.9904128074645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,8,power_law_1.01,1.4559231758117677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.3069632053375244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.578764820098877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.8292032241821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,1,power_law_1.2,1.193779182434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,1,power_law_1.2,2.121721649169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,1,power_law_1.2,2.328985595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,1,power_law_1.2,2.42663688659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,1,power_law_1.2,2.4846336364746096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,1,power_law_1.2,2.6101568222045897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,1,power_law_1.2,2.676326370239258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,1,power_law_1.2,2.740224075317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,1,power_law_1.2,2.7662336349487306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,1,power_law_1.2,2.868838310241699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,1,power_law_1.2,2.960793685913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,1,power_law_1.2,2.9667327880859373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,1,power_law_1.2,3.1303680419921873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,1,power_law_1.2,3.320012664794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,1,power_law_1.2,3.5696640014648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,1,power_law_1.2,3.9614463806152345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,1,power_law_1.2,4.248371124267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,1,power_law_1.2,5.21605110168457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,1,power_law_1.2,6.268108749389649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,1,power_law_1.2,8.46069793701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,1,power_law_1.2,9.860915374755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,8,power_law_1.01,2.2296575546264648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,1,power_law_1.2,13.983334350585938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,8,power_law_1.01,2.897920036315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,2,balanced,0.41369601090749103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,2,balanced,0.7840426762898763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,2,balanced,1.4817280769348145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,2,balanced,3.000149408976237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,2,balanced,5.71238390604655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,2,balanced,8.196095784505209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,2,balanced,8.215375900268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,2,balanced,8.254805246988932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,2,balanced,8.267093022664389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,2,balanced,8.293546676635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,2,balanced,8.312490463256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,2,balanced,8.348330815633139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,2,balanced,8.400042851765951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,2,balanced,8.45909309387207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,2,power_law_1.2,0.19249919652938843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,2,power_law_1.2,0.34938879013061525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,2,power_law_1.2,0.20172159671783446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,2,power_law_1.2,0.49152002334594724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,2,power_law_1.2,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,2,balanced,8.542207717895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,2,power_law_1.2,0.7423999786376954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,2,power_law_1.2,1.131929588317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,2,power_law_1.2,1.4262271881103517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,2,power_law_1.2,0.22855679988861083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,2,balanced,8.609962463378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,2,power_law_1.2,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,2,power_law_1.2,0.44113922119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,2,power_law_1.2,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,2,power_law_1.2,1.9914751052856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,2,power_law_1.2,0.4696000099182129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,2,power_law_1.2,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,2,power_law_1.2,1.8966527938842774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,2,power_law_1.2,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,2,balanced,8.709290822347006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,2,power_law_1.2,0.49745922088623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,2,power_law_1.2,0.4997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,2,power_law_1.2,2.0555776596069335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,1,power_law_1.2,17.942118835449218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,2,power_law_1.2,0.5056511878967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,2,power_law_1.2,0.5005311965942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,2,power_law_1.2,2.140979194641113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,2,power_law_1.2,0.5212160110473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,2,balanced,9.74455451965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,2,power_law_1.2,2.18787841796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,2,power_law_1.2,0.5832704067230224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,2,power_law_1.2,2.1659584045410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,2,power_law_1.2,2.354572868347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,2,balanced,9.337514877319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,2,power_law_1.2,0.61911039352417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,2,power_law_1.2,2.293516731262207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,2,power_law_1.2,2.425856018066406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,2,power_law_1.2,0.6633471965789794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,2,balanced,10.519039789835611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,2,power_law_1.2,2.4330112457275392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,2,power_law_1.2,2.510425567626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,2,power_law_1.2,0.8265536308288575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,2,power_law_1.2,2.6701824188232424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,2,balanced,9.578325271606445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,2,power_law_1.2,2.735910415649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,2,power_law_1.2,2.9497343063354493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,2,power_law_1.2,0.9758720397949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,2,balanced,10.372437159220377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,2,power_law_1.2,3.2425983428955076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,2,power_law_1.2,3.7087230682373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,2,balanced,11.141802469889322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,2,power_law_1.2,4.143910217285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,2,power_law_1.2,5.085593414306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,2,balanced,13.01367441813151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,2,power_law_1.2,1.2443648338317872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,2,power_law_1.2,5.650636672973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,2,power_law_1.2,1.6750591278076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,2,balanced,14.713685353597006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,2,power_law_1.2,7.807366180419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,2,power_law_1.2,10.877337646484374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,2,balanced,20.19908269246419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,2,balanced,24.432810465494793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,2,power_law_1.2,2.4905727386474608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,8,power_law_1.01,4.115852737426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,2,power_law_1.2,2.789376068115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,2,power_law_1.2,4.226867294311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,2,power_law_1.2,6.042214584350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,2,power_law_1.2,0.34140160083770754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,2,power_law_1.2,0.5490687847137451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,2,power_law_1.2,0.6834176063537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,2,power_law_1.2,1.0360832214355469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,2,power_law_1.2,1.0325887680053711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,2,power_law_1.2,1.04202241897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,2,power_law_1.2,1.0559167861938477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,2,power_law_1.2,1.0704895973205566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,2,power_law_1.2,1.1620351791381835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,16,balanced,0.06894933183987935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,16,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,2,power_law_1.2,1.1509759902954102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,16,balanced,0.30702932675679523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,16,balanced,0.5906773408253988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,16,balanced,1.134933312733968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,2,power_law_1.2,1.1810815811157227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,16,balanced,1.3907626469930012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,2,power_law_1.2,1.3280960083007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,16,balanced,1.3955413500467937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,16,balanced,1.3996319770812988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,2,power_law_1.2,1.3567744255065919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,16,balanced,1.3998079299926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,2,power_law_1.2,1.3858816146850585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,16,balanced,1.4035627047220867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,16,balanced,1.4050827026367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,16,balanced,1.4110719362894695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,2,power_law_1.2,1.4764032363891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,16,balanced,1.4167040189107258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,16,balanced,1.422335942586263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,16,balanced,1.4324053128560383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,2,power_law_1.2,1.5654656410217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,16,balanced,1.4769493738810222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,16,balanced,1.4946986834208171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,16,balanced,1.5298560460408528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,2,power_law_1.2,1.742233657836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,16,balanced,1.5520426432291667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,16,balanced,1.7583786646525066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,16,balanced,1.9363840421040852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,16,balanced,2.1394774119059243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,2,power_law_1.2,2.125619125366211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,16,balanced,2.0937387148539224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,16,balanced,2.605738639831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,16,balanced,2.8287998835245767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,16,balanced,4.011349360148112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,2,power_law_1.2,2.7504640579223634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,16,balanced,5.296640078226726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,2,power_law_1.2,3.2473087310791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,2,power_law_1.2,8.644812774658202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,4,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,4,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,4,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,4,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,4,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,2,power_law_1.2,3.792281723022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,4,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,4,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,4,power_law_1.01,0.050988799333572386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,4,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,4,power_law_1.01,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,4,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,4,power_law_1.01,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,4,power_law_1.01,0.10342400074005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,4,power_law_1.01,0.12922879457473754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,4,power_law_1.01,0.14171520471572877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,4,power_law_1.01,0.1662976026535034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,4,power_law_1.01,0.2564095973968506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,2,power_law_1.2,5.443584060668945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,4,power_law_1.01,0.3319616079330444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,4,power_law_1.01,0.43909120559692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,4,power_law_1.01,0.5539840221405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,2,power_law_1.2,6.541721343994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,4,power_law_1.01,0.8515583992004394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,4,power_law_1.01,1.2316672325134277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,4,power_law_1.01,1.7086463928222657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,2,power_law_1.2,9.479782104492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,2,power_law_1.2,10.414694213867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,4,power_law_1.01,2.450636863708496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,2,power_law_1.2,13.094093322753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,4,power_law_1.01,3.6161537170410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,2,power_law_1.2,19.536895751953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,1,power_law_1.2,0.8986623764038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,1,power_law_1.2,1.5003647804260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,1,power_law_1.2,1.8507776260375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,1,power_law_1.2,3.6368385314941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,1,power_law_1.2,3.4631679534912108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,1,power_law_1.2,3.4746368408203123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,1,power_law_1.2,3.4990081787109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,1,power_law_1.2,3.5141632080078127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,1,power_law_1.2,3.752755355834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,1,power_law_1.2,3.760102462768555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,1,power_law_1.2,3.863935852050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,1,power_law_1.2,4.515212631225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,1,power_law_1.2,4.4548095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,1,power_law_1.2,4.592435073852539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,4,power_law_1.01,4.723910522460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,1,power_law_1.2,4.924415969848633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,64,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,64,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,64,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,64,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,64,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,64,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,64,power_law_1.2,0.028646400570869444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,1,power_law_1.2,5.268889617919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,64,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,64,power_law_1.2,0.029657599329948426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,64,power_law_1.2,0.03418880105018616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,64,power_law_1.2,0.04072319865226746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,64,power_law_1.2,0.04769279956817627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,64,power_law_1.2,0.058764797449111936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,64,power_law_1.2,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,64,power_law_1.2,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,1,power_law_1.2,5.784576034545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,64,power_law_1.2,0.1300287961959839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,2,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,2,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,64,power_law_1.2,0.18821120262145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,2,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,2,balanced,0.15974400440851846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,2,balanced,0.3592533270517985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,64,power_law_1.2,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,64,power_law_1.2,0.42597122192382814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,2,balanced,0.48452266057332355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,1,power_law_1.2,7.171071624755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,2,power_law_1.2,22.821670532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,2,balanced,0.48657067616780597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,2,balanced,0.4886186520258586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,2,balanced,0.49134933948516846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,2,balanced,0.4928853511810303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,2,balanced,0.4957866668701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,2,balanced,0.5002239942550659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,2,balanced,0.5039786497751871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,2,balanced,0.5090986490249634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,2,balanced,0.5169493357340494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,2,balanced,0.5220640103022257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,2,balanced,0.5321333408355713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,2,balanced,0.54203200340271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,1,power_law_1.2,8.180531311035157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,2,balanced,0.5667839845021566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,2,balanced,0.6142293214797974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,2,balanced,0.6633706490198771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,2,balanced,0.7929173310597738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,2,balanced,0.9371306896209717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,2,balanced,1.252351999282837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,2,balanced,1.558186690012614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,64,power_law_1.2,0.6082560062408447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,2,balanced,2.223445256551107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,2,balanced,2.827264149983724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,1,power_law_1.2,10.035814666748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,64,power_law_1.2,0.9431039810180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,1,power_law_1.2,11.928781127929687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,64,power_law_1.2,1.4049280166625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,1,power_law_1.2,15.146188354492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,1,power_law_1.2,18.600550842285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,8,power_law_1.2,0.5982207775115966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,8,power_law_1.2,1.0102784156799316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,8,power_law_1.2,1.084620761871338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,8,power_law_1.2,1.2769280433654786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,8,power_law_1.2,1.6336896896362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,8,power_law_1.2,1.4438400268554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,8,power_law_1.2,2.0215808868408205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,8,power_law_1.2,1.4774271965026855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,8,power_law_1.2,1.7526784896850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,8,power_law_1.2,1.743667221069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,8,power_law_1.2,1.8515968322753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,8,power_law_1.2,1.8765823364257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,8,power_law_1.2,1.746124839782715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,8,power_law_1.2,1.8294784545898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,8,power_law_1.2,1.906483268737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,8,power_law_1.2,1.966694450378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,8,power_law_1.2,2.063155174255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,8,power_law_1.2,2.2321151733398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,8,power_law_1.2,2.166764831542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,8,power_law_1.2,2.451251220703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,8,power_law_1.2,2.7508607864379884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,8,power_law_1.2,3.2751617431640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,1,power_law_1.2,24.872755432128905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,8,power_law_1.2,3.8453182220458983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,8,power_law_1.2,4.799897766113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,8,power_law_1.2,5.8193920135498045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,8,power_law_1.2,9.464608001708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,128,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,128,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,128,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,128,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,128,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,128,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,128,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,128,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,8,power_law_1.2,11.036672210693359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,128,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,128,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,128,balanced,0.03531199942032496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,128,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,128,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,128,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,128,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,128,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,128,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,128,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,128,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,128,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,128,balanced,0.0628053347269694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,128,balanced,0.105813334385554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,128,balanced,0.11588266491889954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,128,balanced,0.20667733748753866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,128,balanced,0.293887992699941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,128,balanced,0.4602880080540975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,128,balanced,0.5862400134404501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,1,power_law_1.2,31.697100830078124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,1,power_law_1.2,44.780523681640624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,4,power_law_1.01,0.6057983875274658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,4,power_law_1.01,1.0485759735107423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,4,power_law_1.01,2.043903923034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,4,power_law_1.01,2.0926464080810545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,4,power_law_1.01,3.0295999526977537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,4,power_law_1.01,3.430604934692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,4,power_law_1.01,3.44903678894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,4,power_law_1.01,5.023334503173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,4,power_law_1.01,4.211711883544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,16,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,16,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,4,power_law_1.01,4.403200149536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,16,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,1,power_law_1.2,61.02978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,16,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,16,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,16,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,4,power_law_1.01,4.814233779907227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,16,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,16,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,4,power_law_1.01,5.093580627441407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,16,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,16,power_law_1.2,0.05382400155067444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,16,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,16,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,4,power_law_1.01,4.763647842407226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,16,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,16,power_law_1.2,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,16,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,16,power_law_1.2,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,4,power_law_1.01,4.800716781616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,16,power_law_1.2,0.11878399848937989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,16,power_law_1.2,0.1802240014076233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,16,power_law_1.2,0.2727936029434204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,16,power_law_1.2,0.33218560218811033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,4,power_law_1.01,5.121228790283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,16,power_law_1.2,0.4491263866424561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,16,power_law_1.2,0.6209536075592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,4,power_law_1.01,5.347942352294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,16,power_law_1.2,1.0135552406311035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,16,power_law_1.2,1.3172736167907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,4,power_law_1.01,5.454028701782226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,16,power_law_1.2,2.2249471664428713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,4,power_law_1.01,5.490278244018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,16,power_law_1.2,3.1062015533447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,4,power_law_1.01,6.048972702026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,4,power_law_1.01,5.980774307250977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,4,power_law_1.01,6.538444519042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,4,power_law_1.01,7.097740936279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,4,power_law_1.01,8.040652465820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,4,power_law_1.01,9.32147216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,4,power_law_1.01,11.080703735351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,8,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,8,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,8,power_law_1.2,0.03726080060005188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,8,power_law_1.2,0.03869439959526062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,8,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,8,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,8,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,8,power_law_1.2,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,8,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,8,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,8,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,4,power_law_1.01,15.23609619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,8,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,8,power_law_1.2,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,8,power_law_1.2,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,8,power_law_1.2,0.1218559980392456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,8,power_law_1.2,0.1503167986869812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,8,power_law_1.2,0.1968127965927124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,4,power_law_1.01,15.261080932617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,8,power_law_1.2,0.2232127904891968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,8,power_law_1.2,0.3469311952590942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,8,power_law_1.2,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,4,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,4,balanced,0.06092800199985504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,4,balanced,0.2228906750679016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,4,balanced,0.4164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,4,balanced,0.7551999886830648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,4,balanced,1.0436267058054607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,4,balanced,1.0507946809132893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,4,balanced,1.0548906326293945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,4,balanced,1.05949862798055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,4,balanced,1.0664959748586018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,4,balanced,1.0762240091959636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,4,balanced,1.0856106281280518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,4,balanced,1.0927786827087402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,4,balanced,1.1118933359781902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,4,balanced,1.1313493251800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,4,balanced,1.1475626627604167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,4,balanced,1.1837440331776936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,4,balanced,1.2538879712422688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,4,balanced,1.3325653076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,4,balanced,1.4593547185262044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,4,balanced,1.605120023091634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,4,balanced,1.9374079704284668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,8,power_law_1.2,0.774348783493042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,4,balanced,2.230954647064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,4,balanced,2.925567944844564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,4,balanced,3.6514132817586265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,4,balanced,5.075114568074544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,4,balanced,6.647637049357097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,8,power_law_1.2,1.04202241897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,8,power_law_1.2,1.6273279190063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,8,power_law_1.2,1.803059196472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,32,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,32,balanced,0.042805333932240806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,32,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,32,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,32,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,32,balanced,0.05340800185998281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,32,balanced,0.053898667295773826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,32,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,32,balanced,0.05663999915122986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,32,balanced,0.057333335280418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,32,balanced,0.06126933296521505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,32,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,32,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,32,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,32,balanced,0.09096533060073853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,32,balanced,0.10086400310198466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,32,balanced,0.1725226640701294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,32,balanced,0.21316266059875488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,32,balanced,0.2336426575978597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,32,balanced,0.2775040070215861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,32,balanced,0.32443734010060626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,32,balanced,0.3938666582107544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,32,balanced,0.48144535223642987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,32,balanced,0.6760106881459554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,32,balanced,0.8642559846242269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,32,balanced,1.274880011876424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,32,balanced,1.6708265940348308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,2,power_law_1.01,0.3166208028793335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,2,power_law_1.01,0.5463935852050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,2,power_law_1.01,0.8255488395690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,2,power_law_1.01,1.2978176116943358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,2,power_law_1.01,1.8106367111206054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,2,power_law_1.01,2.4190975189208985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,2,power_law_1.01,3.043737602233887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,2,power_law_1.01,3.1137792587280275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,2,power_law_1.01,3.141427230834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,2,power_law_1.01,3.1698944091796877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,2,power_law_1.01,3.335987091064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,2,power_law_1.01,3.480575942993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,2,power_law_1.01,3.5954689025878905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,2,power_law_1.01,3.7195777893066406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,2,power_law_1.01,3.6622337341308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,2,power_law_1.01,3.8762496948242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,2,power_law_1.01,4.037427139282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,2,power_law_1.01,4.311654281616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,2,power_law_1.01,4.389068984985352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,2,power_law_1.01,4.89349136352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,2,power_law_1.01,5.044633483886718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,2,power_law_1.01,5.7608192443847654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,2,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,2,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,2,power_law_1.01,0.07577599883079529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,2,power_law_1.01,6.277119827270508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,2,power_law_1.01,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,2,power_law_1.01,0.31436800956726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,2,power_law_1.01,0.39915521144866944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,2,power_law_1.01,0.5328896045684814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,2,power_law_1.01,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,2,power_law_1.01,8.387174224853515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,2,power_law_1.01,0.547430419921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,2,power_law_1.01,0.5840896129608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,2,power_law_1.01,0.5675007820129394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,2,power_law_1.01,0.5910528182983399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,2,power_law_1.01,0.6205440044403077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,2,power_law_1.01,0.6348800182342529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,2,power_law_1.01,0.6301504135131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,2,power_law_1.01,9.167257690429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,2,power_law_1.01,0.6600704193115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,2,power_law_1.01,0.6801407814025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,2,power_law_1.01,0.7131135940551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,2,power_law_1.01,0.7962495803833007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,2,power_law_1.01,0.8835071563720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,2,power_law_1.01,0.9963520050048829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,2,power_law_1.01,1.1804672241210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,2,power_law_1.01,12.72442855834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,2,power_law_1.01,1.408614444732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,2,power_law_1.01,1.827225685119629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,2,power_law_1.01,2.1774335861206056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,2,power_law_1.01,3.177881622314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,2,power_law_1.01,16.00122833251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,2,power_law_1.01,3.9946239471435545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,8,power_law_1.2,3.3179264068603516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,8,power_law_1.2,4.242636871337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,32,power_law_1.2,0.6080512046813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,32,power_law_1.2,0.8249343872070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,32,power_law_1.2,0.8210432052612304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,32,power_law_1.2,0.8208383560180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,32,power_law_1.2,0.7575551986694335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,32,power_law_1.2,0.6154240131378174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,32,power_law_1.2,0.6705152034759522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,32,power_law_1.2,0.7178239822387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,32,power_law_1.2,0.667033576965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,32,power_law_1.2,0.7088128089904785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,32,power_law_1.2,0.7352320194244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,32,power_law_1.2,0.8062975883483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,32,power_law_1.2,0.8220288276672363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,32,power_law_1.2,0.8220671653747559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,32,power_law_1.2,0.7753727912902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,1,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,1,power_law_1.01,0.02865920066833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,1,power_law_1.01,0.03213439881801605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,32,power_law_1.2,0.8456192016601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,1,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,1,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,1,power_law_1.01,0.036652800440788266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,32,power_law_1.2,0.8452095985412598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,1,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,1,power_law_1.01,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,1,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,32,power_law_1.2,0.9345024108886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,1,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,1,power_law_1.01,0.05548800230026245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,32,power_law_1.2,0.9248512268066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,1,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,1,power_law_1.01,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,32,power_law_1.2,1.06495361328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,1,power_law_1.01,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,32,power_law_1.2,1.2388352394104003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,1,power_law_1.01,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,1,power_law_1.01,0.12144639492034912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,1,power_law_1.01,0.15544320344924928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,32,power_law_1.2,1.5165439605712892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,32,power_law_1.2,1.8159360885620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,1,power_law_1.01,0.2070528030395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,1,power_law_1.01,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,32,power_law_1.2,2.6695680618286133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,1,power_law_1.01,0.3280895948410034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,32,power_law_1.2,3.4385921478271486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,32,power_law_1.2,4.494131088256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,1,power_law_1.01,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,4,power_law_1.2,0.5464064121246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,4,power_law_1.2,1.0190848350524901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,32,power_law_1.2,7.158988952636719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,4,power_law_1.2,1.248256015777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,4,power_law_1.2,1.5736831665039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,4,power_law_1.2,2.2163135528564455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,4,power_law_1.2,2.388991928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,4,power_law_1.2,3.2956417083740233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,4,power_law_1.2,3.304038238525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,4,power_law_1.2,3.146950340270996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,1,power_law_1.01,0.5611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,4,power_law_1.2,3.270041656494141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,4,power_law_1.2,3.597312164306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,4,power_law_1.2,3.5655681610107424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,4,power_law_1.2,3.4248703002929686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,4,power_law_1.2,3.5278526306152345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,4,power_law_1.2,3.9018177032470702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,4,power_law_1.2,3.868460845947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,1,power_law_1.01,0.7575551986694335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,4,power_law_1.2,4.115865707397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,4,power_law_1.2,4.157849502563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,4,power_law_1.2,4.497612762451172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,4,power_law_1.2,4.807270431518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,4,power_law_1.2,4.838195037841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,2,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,2,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,2,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,2,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,2,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,2,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,2,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,2,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,2,balanced,0.04043200115362803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,2,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,4,power_law_1.2,5.843558502197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,2,balanced,0.04385599990685781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,2,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,2,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,2,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,2,balanced,0.08959999680519104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,2,balanced,0.09250133236249287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,2,balanced,0.0993280013402303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,2,balanced,0.16725333531697592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,2,balanced,0.19045867522557577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,2,balanced,0.26385066906611127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,2,balanced,0.3201706608136495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,2,balanced,0.4437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,2,balanced,0.624127984046936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,2,balanced,0.984058698018392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,4,power_law_1.2,6.522061157226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,2,balanced,1.3387093544006348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,2,balanced,2.013696034749349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,2,balanced,2.7081387837727866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,4,power_law_1.2,9.468294525146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,4,power_law_1.2,9.890611267089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,1,power_law_1.01,1.152409553527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,4,power_law_1.2,13.321626281738281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,4,power_law_1.2,17.21507873535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,1,power_law_1.01,1.5718400001525878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,16,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,16,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,16,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,16,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,16,balanced,0.06673066814740498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,16,balanced,0.20053333044052124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,16,balanced,0.20138667027155557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,16,balanced,0.20206934213638306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,16,balanced,0.2034346659978231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,16,balanced,0.2034346659978231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,16,balanced,0.20514132579167685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,16,balanced,0.20684800545374551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,16,balanced,0.2097439964612325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,16,balanced,0.20992000897725424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,16,balanced,0.21333332856496176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,16,balanced,0.22219733397165933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,16,balanced,0.22715733448664346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,16,balanced,0.23500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,16,balanced,0.2520693341890971
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,16,balanced,0.29713066418965656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,16,balanced,0.30530667304992676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,16,balanced,0.3938986857732137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,16,balanced,0.40857601165771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,16,balanced,0.6031306584676107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,16,balanced,0.808789332707723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,16,balanced,1.1818666458129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,16,balanced,1.5590400695800781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,1,power_law_1.01,2.513510322570801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,4,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,4,balanced,0.046240001916885376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,4,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,4,balanced,0.05426666637261709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,4,balanced,0.06758399804433186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,4,balanced,0.0679253339767456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,4,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,4,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,4,balanced,0.0692799985408783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,4,balanced,0.07850666840871175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,4,balanced,0.1088853379090627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,4,balanced,0.1076800028483073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,4,balanced,0.15718400478363037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,4,balanced,0.1776640017827352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,4,balanced,0.1950719952583313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,4,balanced,0.21026132504145303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,4,balanced,0.2525866627693176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,4,balanced,0.2988373239835103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,4,balanced,0.381440003712972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,4,balanced,0.45943466822306317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,4,balanced,0.6766933600107828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,4,balanced,0.8930986722310384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,4,balanced,1.4615893363952637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,4,balanced,2.041173299153646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,4,balanced,3.118250528971354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,4,balanced,4.155392011006673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,1,power_law_1.01,3.377561569213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,16,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,16,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,16,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,16,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,16,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,16,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,16,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,16,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,16,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,16,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,16,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,16,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,16,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,16,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,16,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,16,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,16,balanced,0.08482133348782857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,16,balanced,0.11281067132949829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,16,balanced,0.17083734273910522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,16,balanced,0.20428800582885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,16,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,16,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,16,balanced,0.44014934698740643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,16,balanced,0.5666133165359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,4,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,4,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,4,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,4,balanced,0.13312000036239624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,4,balanced,0.35123201211293537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,4,balanced,0.6688213348388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,4,balanced,0.6720853646596273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,4,balanced,0.673962672551473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,4,balanced,0.6772053241729736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,4,balanced,0.677717367808024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,4,balanced,0.6821386814117432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,4,balanced,0.6864213148752848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,4,balanced,0.6881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,4,balanced,0.6947840054829916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,4,balanced,0.7043413321177164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,4,balanced,0.7106560071309408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,4,balanced,0.719701369603475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,4,balanced,0.7616853713989258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,4,balanced,0.7862613201141357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,4,balanced,0.8951466878255209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,4,balanced,0.8634026845296224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,4,balanced,0.9728000164031982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,4,balanced,1.0920960108439128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,4,balanced,1.3786452611287434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,4,balanced,1.6414720217386882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,4,balanced,2.2044960657755532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,4,balanced,2.758485476175944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,128,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,128,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,128,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,128,balanced,0.036159999668598175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,128,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,128,balanced,0.03718400001525879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,128,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,128,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,128,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,128,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,128,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,128,balanced,0.04025600105524063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,128,balanced,0.04060266663630804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,128,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,128,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,128,balanced,0.04469866553942362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,128,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,128,balanced,0.05442133545875549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,128,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,128,balanced,0.06365866462389629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,128,balanced,0.07014399766921997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,128,balanced,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,128,balanced,0.10615467031796773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,128,balanced,0.1616213321685791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,128,balanced,0.1925119956334432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,128,balanced,0.35123201211293537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,128,balanced,0.44680531819661456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,2,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,2,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,2,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,2,power_law_1.01,0.06305919885635376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,2,power_law_1.01,0.09277439713478089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,2,power_law_1.01,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,2,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,2,power_law_1.01,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,2,power_law_1.01,0.24330239295959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,2,power_law_1.01,0.2572160005569458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,2,power_law_1.01,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,2,power_law_1.01,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,2,power_law_1.01,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,2,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,2,power_law_1.01,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,2,power_law_1.01,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,2,power_law_1.01,0.38686718940734866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,2,power_law_1.01,0.4493311882019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,2,power_law_1.01,0.5167103767395019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,2,power_law_1.01,0.7055359840393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,2,power_law_1.01,0.9396224021911621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,2,power_law_1.01,1.4073856353759766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,2,power_law_1.01,1.8132991790771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,2,power_law_1.01,2.61529598236084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,2,power_law_1.01,3.5938304901123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,2,power_law_1.01,5.264384078979492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,2,power_law_1.01,6.943328094482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,1,balanced,0.5867520173390707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,1,balanced,1.029802640279134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,1,balanced,2.0196693738301597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,1,balanced,3.97977606455485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,1,balanced,8.138751983642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,1,balanced,15.7392209370931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,1,balanced,15.776256561279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,1,balanced,15.823354085286459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,1,balanced,15.850325266520182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,1,balanced,15.881727854410807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,1,balanced,15.947434743245443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,1,balanced,16.013482411702473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,1,balanced,16.06468327840169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,1,balanced,16.166571299235027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,1,balanced,16.27013905843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,1,balanced,16.35601043701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,1,balanced,16.511316935221355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,1,balanced,16.799381256103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,1,balanced,17.08561070760091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,1,balanced,17.648298899332683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,1,balanced,18.985467274983723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,1,balanced,19.73094431559245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,1,balanced,20.887893676757812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,1,balanced,21.523114522298176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,32,balanced,0.022357332209746044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,32,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,32,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,32,balanced,0.022357332209746044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,32,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,32,balanced,0.023887999355793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,32,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,32,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,32,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,32,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,32,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,32,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,1,balanced,23.964670817057293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,32,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,32,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,32,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,32,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,32,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,32,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,32,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,32,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,32,balanced,0.05323199927806854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,32,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,32,balanced,0.09830400347709656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,32,balanced,0.19473065932591757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,32,balanced,0.3056640028953552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,32,balanced,0.41557331879933673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,1,balanced,32.033793131510414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,1,balanced,39.44379679361979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,8,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,8,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,8,balanced,0.04400533437728882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,8,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,8,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,8,balanced,0.06195199986298879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,8,balanced,0.2201333244641622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,8,balanced,0.2307413419087728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,8,balanced,0.23244800170262656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,8,balanced,0.23534933725992838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,8,balanced,0.2379093368848165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,8,balanced,0.24285866816838583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,8,balanced,0.2461013396581014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,8,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,8,balanced,0.2640213370323181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,8,balanced,0.27064534028371173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,8,balanced,0.2868906656901042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,8,balanced,0.3184533317883809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,8,balanced,0.35140268007914227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,8,balanced,0.3979733387629191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,8,balanced,0.4375893274943034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,8,balanced,0.5587626695632935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,8,balanced,0.706559975941976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,8,balanced,1.0821973482767742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,8,balanced,1.5286614100138347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,8,balanced,2.253653367360433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,8,balanced,2.984959920247396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,4,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,4,balanced,0.032245332996050514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,4,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,4,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,4,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,4,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,4,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,4,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,4,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,4,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,4,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,4,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,4,balanced,0.056320001681645714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,4,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,4,balanced,0.08567466338475545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,4,balanced,0.09403733412424724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,4,balanced,0.08806399504343669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,4,balanced,0.14472533265749613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,4,balanced,0.1634986698627472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,4,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,4,balanced,0.3176106611887614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,4,balanced,0.4399786790211995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,4,balanced,0.572927991549174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,4,balanced,0.8378026485443115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,4,balanced,1.1526827017466228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,4,balanced,1.7402879397074382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,4,balanced,2.358954588572184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,1,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,1,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,1,balanced,0.16401066382726034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,1,balanced,0.3561813433965047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,1,balanced,0.672426700592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,1,balanced,1.3149867057800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,1,balanced,1.3219839731852214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,4,power_law_1.2,0.19537919759750366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,1,balanced,1.327957312266032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,4,power_law_1.2,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,1,balanced,1.3370025952657063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,4,power_law_1.2,0.3551232099533081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,1,balanced,1.3414400418599446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,4,power_law_1.2,0.472441577911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,1,balanced,1.3499733606974285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,4,power_law_1.2,0.44359679222106935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,4,power_law_1.2,0.743833589553833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,1,balanced,1.3620905876159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,4,power_law_1.2,0.7802879810333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,1,balanced,1.3718187014261882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,4,power_law_1.2,0.8146944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,1,balanced,1.3912746111551921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,1,balanced,1.41156800587972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,4,power_law_1.2,0.9125887870788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,1,balanced,1.4315519332885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,4,power_law_1.2,0.8400896072387696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,1,balanced,1.4713013966878254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,4,power_law_1.2,0.908083152770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,1,balanced,1.5517013867696126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,4,power_law_1.2,0.861184024810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,1,balanced,1.6341333389282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,4,power_law_1.2,0.9521151542663574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,1,balanced,1.7805546124776204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,4,power_law_1.2,0.9533439636230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,1,balanced,1.9660800298055012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,4,power_law_1.2,0.9631744384765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,1,balanced,2.313706715901693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,4,power_law_1.2,0.8927231788635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,4,power_law_1.2,0.9963456153869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,1,balanced,2.6192213694254556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,4,power_law_1.2,1.0147839546203614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,4,power_law_1.2,1.105510425567627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,1,balanced,3.2442026138305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,4,power_law_1.2,1.1829248428344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,4,power_law_1.2,1.3928447723388673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,1,balanced,3.9249919255574546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,4,power_law_1.2,1.7821695327758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,4,power_law_1.2,1.9492479324340821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,1,balanced,5.287594795227051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,4,power_law_1.2,2.7453439712524412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,1,balanced,6.910122553507487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,2,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,2,power_law_1.2,0.1621888041496277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,2,power_law_1.2,0.25292799472808836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,2,power_law_1.2,0.4024320125579834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,2,power_law_1.2,0.5163008213043213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,2,power_law_1.2,0.6637567996978759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,2,power_law_1.2,1.0117119789123534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,4,power_law_1.2,2.814361572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,2,power_law_1.2,1.0133503913879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,2,power_law_1.2,1.0334207534790039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,4,power_law_1.2,3.4981822967529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,2,power_law_1.2,1.0602496147155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,2,power_law_1.2,1.1026432037353515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,2,power_law_1.2,1.1341823577880858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,2,power_law_1.2,1.1653120040893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,4,power_law_1.2,4.8437248229980465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,2,power_law_1.2,1.2201984405517579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,2,power_law_1.2,1.231052780151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,2,power_law_1.2,1.2990464210510253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,2,power_law_1.2,1.2914688110351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,2,power_law_1.2,1.4264320373535155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,2,power_law_1.2,1.4729215621948242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,2,power_law_1.2,1.6168960571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,2,power_law_1.2,1.7573888778686524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,2,power_law_1.2,2.08670711517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,2,power_law_1.2,2.30010871887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,2,power_law_1.2,3.0468095779418944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,2,power_law_1.2,3.6571136474609376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,2,power_law_1.2,4.755660629272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,2,power_law_1.2,6.065766525268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.32071681022644044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.5476352214813233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,1,power_law_1.2,1.0346495628356933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,1,power_law_1.2,1.8728960037231446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,1,power_law_1.2,2.774425506591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,1,power_law_1.2,3.789004898071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,1,power_law_1.2,5.6993663787841795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,1,power_law_1.2,6.017228698730468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,1,power_law_1.2,6.363545608520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,1,power_law_1.2,6.429695892333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,1,power_law_1.2,6.7346435546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,1,power_law_1.2,6.803250885009765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,1,power_law_1.2,6.914867401123047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,1,power_law_1.2,7.455129241943359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,1,power_law_1.2,7.682457733154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,1,power_law_1.2,7.714201354980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,1,power_law_1.2,7.998258972167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,1,power_law_1.2,8.778137969970704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,1,power_law_1.2,9.076531219482423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,1,power_law_1.2,9.699942779541015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,1,power_law_1.2,10.02782745361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,1,power_law_1.2,11.706368255615235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,1,power_law_1.2,12.922463989257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,1,power_law_1.2,16.635903930664064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,4,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,4,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,4,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,4,power_law_1.01,0.030483201146125793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,4,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,4,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,4,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,4,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,4,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,1,power_law_1.2,17.877810668945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,1,balanced,0.17749333381652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,4,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,1,balanced,0.38707200686136883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,4,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,1,balanced,0.7336853345235189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,4,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,1,balanced,1.418922742207845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,4,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,4,power_law_1.01,0.0442111998796463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,1,balanced,2.743808110555013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,4,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,4,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,4,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,1,balanced,4.035584131876628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,4,power_law_1.01,0.08663039803504943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,4,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,1,balanced,4.058282534281413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,4,power_law_1.01,0.1810431957244873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,1,balanced,4.079786618550618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,1,balanced,4.104703903198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,1,balanced,4.1260372797648115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,1,power_law_1.2,23.962623596191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,1,balanced,4.166144053141276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,1,balanced,4.206250508626302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,4,power_law_1.01,0.26664960384368896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,1,balanced,4.243626594543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,1,balanced,4.316842714945476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,1,balanced,4.388693491617839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,1,balanced,4.456960042317708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,1,balanced,4.597077369689941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,1,balanced,4.8660478591918945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,1,power_law_1.2,29.520486450195314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,1,balanced,5.132800102233887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,4,power_law_1.01,0.3985408067703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,1,balanced,5.820757548014323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,1,balanced,6.131882349650065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,1,balanced,7.213055928548177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,1,balanced,8.218095779418945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,4,power_law_1.01,0.501964807510376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,1,balanced,11.203924814860025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,1,balanced,12.670976003011068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,32,power_law_1.01,0.33011839389801023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,32,power_law_1.01,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,32,power_law_1.01,0.29736320972442626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,32,power_law_1.01,0.30064640045166013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,32,power_law_1.01,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,1,balanced,18.11302439371745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,32,power_law_1.01,0.26869759559631345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,32,power_law_1.01,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,32,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,32,power_law_1.01,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,32,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,32,power_law_1.01,0.3014656066894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,32,power_law_1.01,0.3235840082168579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,32,power_law_1.01,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,32,power_law_1.01,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,32,power_law_1.01,0.32522239685058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,32,power_law_1.01,0.3295232057571411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,32,power_law_1.01,0.3373055934906006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,1,balanced,23.199745178222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,32,power_law_1.01,0.3631103992462158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,4,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,4,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,4,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,32,power_law_1.01,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,4,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,4,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,4,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,32,power_law_1.01,0.4186111927032471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,4,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,4,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,32,power_law_1.01,0.5144576072692871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,4,power_law_1.01,0.8994815826416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,32,power_law_1.01,0.6670271873474121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,32,power_law_1.01,0.81080322265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,4,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,4,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,4,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,4,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,4,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,4,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,4,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,4,power_law_1.01,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,4,power_law_1.01,0.09563519954681396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,4,power_law_1.01,0.11816960573196411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,32,power_law_1.01,1.1833344459533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,4,power_law_1.01,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,32,power_law_1.01,1.4624768257141114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,32,power_law_1.01,2.1295103073120116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,4,power_law_1.01,0.2590719938278198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,32,power_law_1.01,2.9882368087768554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,4,power_law_1.01,0.38338561058044435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,4,power_law_1.01,0.5343232154846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,4,power_law_1.01,0.7045119762420654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,4,power_law_1.01,1.0539008140563966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,4,power_law_1.01,1.1849727630615234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,4,power_law_1.01,1.5951871871948242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,4,power_law_1.01,1.8108415603637695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,4,power_law_1.01,2.4416255950927734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,4,power_law_1.01,2.5780223846435546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,4,power_law_1.01,3.083673667907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,2,power_law_1.2,0.03048959970474243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,2,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,2,power_law_1.2,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,2,power_law_1.2,0.18677760362625123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,2,power_law_1.2,0.23244800567626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,2,power_law_1.2,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,2,power_law_1.2,0.40325121879577636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,2,power_law_1.2,0.4186111927032471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,2,power_law_1.2,0.44216318130493165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,2,power_law_1.2,0.4567039966583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,2,power_law_1.2,0.46243839263916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,2,power_law_1.2,0.46919679641723633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,2,power_law_1.2,0.4823040008544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,2,power_law_1.2,0.49640960693359376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,2,power_law_1.2,0.5048319816589355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,2,power_law_1.2,0.510975980758667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,2,power_law_1.2,0.5279744148254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,2,power_law_1.2,0.5736447811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,2,power_law_1.2,0.5947391986846924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,2,power_law_1.2,0.6875135898590088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,2,power_law_1.2,0.7694143772125244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,2,power_law_1.2,0.8953856468200684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,2,power_law_1.2,1.1538432121276856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,2,power_law_1.2,1.5056703567504883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,4,balanced,0.2711893320083618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,4,balanced,0.2397866646448771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,4,balanced,0.46745598316192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,4,balanced,0.4684799909591675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,4,balanced,0.4700160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,4,balanced,0.47274665037790936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,4,balanced,0.4747946659723918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,4,balanced,0.47650134563446045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,4,balanced,0.482474684715271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,4,balanced,0.48366932074228924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,4,balanced,0.49032533168792725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,4,balanced,0.5084160168965658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,2,power_law_1.2,1.903411293029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,4,balanced,0.5113120079040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,4,balanced,0.5183146794637045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,4,balanced,0.5309439897537231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,4,balanced,0.5425493319829305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,4,balanced,0.5775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,2,power_law_1.2,2.7430912017822267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,4,balanced,0.8212479750315348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,4,balanced,0.866645336151123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,4,balanced,1.0881653626759846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,4,balanced,1.3226666450500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,4,balanced,1.7365333239237468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,4,balanced,2.090832074483236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,4,balanced,3.003391901652018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,4,balanced,3.8959786097208657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,4,balanced,5.392042795817058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,4,balanced,7.085226694742839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,2,power_law_1.2,3.279667282104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,8,power_law_1.01,1.0885120391845704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,8,power_law_1.01,2.108620834350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,8,power_law_1.01,2.8915712356567385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,8,power_law_1.01,2.315059280395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,8,power_law_1.01,3.769753646850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,8,power_law_1.01,3.3558528900146483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,8,power_law_1.01,3.297280120849609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,8,power_law_1.01,3.4871295928955077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,8,power_law_1.01,3.340902328491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,8,power_law_1.01,3.5432449340820313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,8,power_law_1.01,3.5123199462890624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,8,power_law_1.01,3.648102569580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,8,power_law_1.01,3.6861953735351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,8,power_law_1.01,3.615737533569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,8,power_law_1.01,4.017561721801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,8,power_law_1.01,3.643596649169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,8,power_law_1.2,0.22609920501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,8,power_law_1.01,3.936665725708008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,8,power_law_1.2,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,2,power_law_1.01,1.2681216239929198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,8,power_law_1.2,0.27832319736480715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,8,power_law_1.2,0.39444479942321775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,2,power_law_1.01,2.2163455963134764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,8,power_law_1.2,0.26029438972473146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,8,power_law_1.01,4.124870300292969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,8,power_law_1.2,0.4345856189727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,2,power_law_1.01,2.4920064926147463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,8,power_law_1.2,0.4380671977996826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,8,power_law_1.2,0.450764799118042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,8,power_law_1.01,4.4931072235107425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,8,power_law_1.2,0.42414078712463377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,2,power_law_1.01,3.2409599304199217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,8,power_law_1.2,0.43683838844299316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,8,power_law_1.2,0.46735358238220215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,8,power_law_1.2,0.45424637794494627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,2,power_law_1.01,3.505971145629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,8,power_law_1.2,0.4544511795043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,8,power_law_1.01,4.663910293579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,8,power_law_1.2,0.46592001914978026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,8,power_law_1.2,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,2,power_law_1.01,3.541401672363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,8,power_law_1.2,0.4933631896972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,8,power_law_1.2,0.5156864166259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,8,power_law_1.01,4.961689758300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,2,power_law_1.01,3.7072895050048826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,2,power_law_1.01,4.434316635131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,8,power_law_1.2,0.5701568126678467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,8,power_law_1.01,5.914828872680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,8,power_law_1.2,0.5963776111602783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,8,power_law_1.2,0.6782976150512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,2,power_law_1.01,5.049753570556641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,8,power_law_1.2,0.8112128257751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,8,power_law_1.01,7.035699462890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,2,power_law_1.01,5.1353599548339846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,2,power_law_1.01,4.553523254394531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,8,power_law_1.01,9.619046020507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,2,power_law_1.01,5.381119918823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,8,power_law_1.2,1.0960895538330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,2,power_law_1.01,5.901721572875976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,8,power_law_1.01,9.42366714477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,2,power_law_1.01,6.5867774963378904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,8,power_law_1.2,1.5155200004577636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,8,power_law_1.2,1.9922943115234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,2,power_law_1.01,7.306649780273437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,8,power_law_1.01,13.420748901367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,2,power_law_1.01,7.902381134033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,8,power_law_1.2,2.7109376907348635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,2,power_law_1.01,10.030079650878907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,8,power_law_1.01,16.243096923828126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,2,power_law_1.01,12.902195739746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,2,power_law_1.01,16.00061492919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,8,power_law_1.2,3.8916095733642577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,2,power_law_1.01,20.815667724609376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,2,power_law_1.01,25.115647888183595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,32,power_law_1.01,0.05588480234146118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,32,power_law_1.01,0.049318400025367734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,32,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,32,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,32,power_law_1.01,0.04750719964504242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,8,power_law_1.2,4.526694488525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,32,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,32,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,32,power_law_1.01,0.049542400240898135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,32,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,32,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,8,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,32,power_law_1.01,0.052832001447677614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,32,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,8,power_law_1.01,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,32,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,8,power_law_1.01,0.1347584009170532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,8,power_law_1.01,0.1052672028541565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,32,power_law_1.01,0.058956801891326904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,2,power_law_1.01,29.648486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,8,power_law_1.01,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,32,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,8,power_law_1.01,0.2238464117050171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,32,power_law_1.01,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,8,power_law_1.01,0.21237759590148925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,32,power_law_1.01,0.0800704002380371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,8,power_law_1.01,0.23470079898834229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,8,power_law_1.01,0.2303999900817871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,32,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,8,power_law_1.01,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,32,power_law_1.01,0.20582399368286133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,8,power_law_1.01,0.23265280723571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,32,power_law_1.01,0.26664960384368896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,8,power_law_1.01,0.24023039340972902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,8,power_law_1.01,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,32,power_law_1.01,0.37212159633636477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,8,power_law_1.01,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,8,power_law_1.01,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,32,power_law_1.01,0.47964158058166506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,8,power_law_1.01,0.26213760375976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,8,power_law_1.01,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,32,power_law_1.01,0.7806719779968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,8,power_law_1.01,0.29409279823303225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,8,power_law_1.01,0.33505280017852784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,32,power_law_1.01,0.9779199600219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,8,power_law_1.01,0.4087808132171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,8,power_law_1.01,0.5582848072052002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,8,power_law_1.01,0.7448575973510743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,32,power_law_1.01,1.600102424621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,8,power_law_1.01,1.1134976387023925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,32,power_law_1.01,2.2575103759765627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,8,power_law_1.01,1.4000127792358399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,8,power_law_1.01,1.9759103775024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,8,power_law_1.01,3.0001152038574217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,2,power_law_1.01,36.60369873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,4,power_law_1.2,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,2,power_law_1.01,47.166445922851565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,4,power_law_1.2,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,4,power_law_1.2,0.5677055835723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,4,power_law_1.2,0.9168895721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,4,power_law_1.2,1.1229184150695801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,4,power_law_1.2,1.3752320289611817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,4,power_law_1.2,1.862656021118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,4,power_law_1.2,1.732383918762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,4,power_law_1.2,1.660313606262207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,4,power_law_1.2,1.7164287567138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,4,power_law_1.2,1.6652288436889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,4,power_law_1.2,1.8685951232910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,4,power_law_1.2,1.940070343017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,4,power_law_1.2,1.8049024581909179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,4,power_law_1.2,1.9906560897827148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,4,balanced,0.5111466646194458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,4,balanced,0.45789865652720135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,4,power_law_1.2,1.9173376083374023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,4,balanced,0.8927573362986246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,4,balanced,0.9381546974182129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,4,balanced,0.8953173160552979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,4,power_law_1.2,2.0543487548828123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,4,balanced,0.9041919708251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,4,balanced,0.9117013613382975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,4,balanced,0.9117013613382975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,4,power_law_1.2,2.177024078369141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,4,balanced,0.9135786692301432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,4,balanced,0.9204053084055582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,4,balanced,0.9280853271484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,4,balanced,0.934229294459025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,4,power_law_1.2,2.1997568130493166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,4,balanced,0.9453226725260416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,4,balanced,1.016319990158081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,4,balanced,1.0628853638966878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,4,power_law_1.2,2.395955276489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,4,balanced,1.0775893529256184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,4,balanced,1.0830506483713787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,4,balanced,1.7474560737609863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,4,power_law_1.2,2.5997312545776365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,4,balanced,1.897813320159912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,4,balanced,2.5376267433166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,4,power_law_1.2,3.1670272827148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,4,balanced,3.4051411946614585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,4,power_law_1.2,3.56126708984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,4,balanced,4.63428274790446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,4,power_law_1.2,4.572774505615234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,4,balanced,5.893802642822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,4,power_law_1.2,5.700403213500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,4,balanced,7.666175842285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,4,balanced,9.710592269897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,4,power_law_1.2,7.8000129699707035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,2,power_law_1.01,51.121331787109376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,4,balanced,13.11675771077474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,4,power_law_1.2,9.593651580810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,2,power_law_1.2,0.33075199127197263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,2,power_law_1.2,0.5480447769165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,2,power_law_1.2,0.7034880161285401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,2,power_law_1.2,1.2662400245666503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,4,balanced,16.438613891601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,2,power_law_1.2,1.7123327255249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,2,power_law_1.2,2.145478439331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,2,power_law_1.2,3.0062591552734377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,2,power_law_1.2,3.240140914916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,2,power_law_1.2,3.61267204284668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,2,power_law_1.2,3.3357822418212892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,2,power_law_1.2,3.4686656951904298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,2,power_law_1.2,3.4439167022705077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,2,power_law_1.2,3.5782657623291017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,2,power_law_1.2,3.65588493347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,2,power_law_1.2,3.8512641906738283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,2,power_law_1.2,3.8833919525146485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,2,power_law_1.2,3.830374526977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,2,power_law_1.2,4.2356414794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,2,power_law_1.2,4.482048034667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,2,power_law_1.2,4.773273468017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,2,power_law_1.2,4.931584167480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,2,power_law_1.2,5.58263053894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,2,power_law_1.2,6.464511871337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,2,power_law_1.2,8.712191772460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,2,power_law_1.2,10.101760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,2,power_law_1.2,14.76874237060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,2,power_law_1.2,15.700979614257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,2,power_law_1.01,67.77548828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,2,power_law_1.01,82.6767333984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,64,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,64,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,64,power_law_1.2,0.028863999247550964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,64,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,64,power_law_1.2,0.030508801341056824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,64,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,64,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,64,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,64,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,64,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,64,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,64,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,64,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,64,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,64,power_law_1.2,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,64,power_law_1.2,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,64,power_law_1.2,0.1159168004989624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,64,power_law_1.2,0.13660160303115845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,64,power_law_1.2,0.19148800373077393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,64,power_law_1.2,0.28241920471191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,64,power_law_1.2,0.5107711791992188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,64,power_law_1.2,0.5500927925109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,64,power_law_1.2,0.8642560005187988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,4,power_law_1.2,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,4,power_law_1.2,0.42127361297607424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,4,power_law_1.2,0.33013761043548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,4,power_law_1.2,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,4,power_law_1.2,0.4704256057739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,4,power_law_1.2,0.47656960487365724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,4,power_law_1.2,0.5007359981536865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,4,power_law_1.2,0.5689343929290771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,4,power_law_1.2,0.5150656223297119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,4,power_law_1.2,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,4,power_law_1.2,0.6633471965789794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,4,power_law_1.2,0.6668288230895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,4,power_law_1.2,0.6801407814025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,4,power_law_1.2,0.6905856132507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,4,power_law_1.2,0.7354368209838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,4,power_law_1.2,0.8607744216918946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,4,power_law_1.2,0.910540771484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,4,power_law_1.2,1.0934271812438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,64,power_law_1.2,1.1941887855529785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,4,power_law_1.2,1.2193792343139649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,4,power_law_1.2,1.983078384399414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,4,power_law_1.2,2.1526527404785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,8,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,8,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,8,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,8,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,8,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,8,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,8,balanced,0.034128000338872276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,8,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,8,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,8,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,8,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,8,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,8,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,8,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,8,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,8,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,8,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,8,balanced,0.09011200070381165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,8,balanced,0.08021333316961925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,8,balanced,0.144896000623703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,8,balanced,0.15359999736150107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,8,balanced,0.22613332668940225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,8,balanced,0.29661333560943604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,8,balanced,0.4379306634267171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,8,balanced,0.6125226815541586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,64,power_law_1.2,2.171494483947754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,8,balanced,0.9419093132019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,8,balanced,1.2683946291605632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,4,power_law_1.2,3.3380352020263673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,4,power_law_1.2,3.9606273651123045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,1,balanced,0.27374933163324994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,1,balanced,0.46984533468882245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,1,balanced,0.9064106941223145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,1,balanced,0.9082880020141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,1,balanced,0.9035092989603678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,1,balanced,0.9115306536356608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,1,balanced,0.9180160363515218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,1,balanced,0.9241600036621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,1,balanced,0.9429333209991455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,1,balanced,0.9471999804178873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,1,balanced,0.9572693506876627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,1,balanced,0.9673386414845785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,1,balanced,0.9767253398895264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,1,balanced,0.9927679697672526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,1,balanced,1.1006293296813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,1,balanced,1.1327146689097087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,1,balanced,1.0513066450754802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,1,balanced,1.1504639784495037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,1,balanced,1.2707680066426594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,1,balanced,1.5066453615824382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,1,balanced,1.9191466967264812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,1,balanced,2.847231864929199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,1,balanced,3.631264050801595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,1,balanced,5.224960009256999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,1,balanced,6.837077458699544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,1,balanced,10.207573572794596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,1,balanced,13.292884826660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,64,power_law_1.2,2.453708839416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,4,power_law_1.2,5.250662231445313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,64,power_law_1.01,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,64,power_law_1.01,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,64,power_law_1.01,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,64,power_law_1.01,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,64,power_law_1.01,0.2170880079269409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,64,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,64,power_law_1.01,0.2883584022521973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,64,power_law_1.01,0.25026559829711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,64,power_law_1.01,0.2924479961395264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,64,power_law_1.01,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,64,power_law_1.01,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,64,power_law_1.01,0.2844480037689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,64,power_law_1.01,0.29818880558013916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,64,power_law_1.01,0.2760512113571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,4,power_law_1.2,6.862643432617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,64,power_law_1.01,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,64,power_law_1.01,0.2983936071395874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,64,power_law_1.01,0.32049920558929446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,64,power_law_1.01,0.3407871961593628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,64,power_law_1.01,0.35184640884399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,64,power_law_1.01,0.4286208152770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,64,power_law_1.01,0.5365759849548339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,64,power_law_1.01,0.6610943794250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,64,power_law_1.01,0.932863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,64,power_law_1.01,1.328947162628174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,64,power_law_1.01,1.6510976791381835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,64,power_law_1.01,2.4031232833862304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,64,power_law_1.01,2.807193565368652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,4,power_law_1.2,10.33175048828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,4,power_law_1.2,0.024959999322891235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,4,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,4,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,4,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,4,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,4,power_law_1.2,0.21459200382232665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,4,power_law_1.2,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,4,power_law_1.2,0.18718719482421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,4,power_law_1.2,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,4,power_law_1.2,0.2170559883117676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,4,power_law_1.2,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,4,power_law_1.2,0.24226560592651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,4,power_law_1.2,12.668109130859374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,4,power_law_1.2,0.23203840255737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,4,power_law_1.2,0.24450559616088868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,4,power_law_1.2,0.24227840900421144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,4,power_law_1.2,0.2519040107727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,4,power_law_1.2,0.2541311979293823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,4,power_law_1.2,0.27381761074066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,4,power_law_1.2,0.2846400022506714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,4,power_law_1.2,0.32194559574127196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,4,power_law_1.2,0.35856640338897705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,4,power_law_1.2,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,4,power_law_1.2,0.589414405822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,4,power_law_1.2,0.9828351974487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,4,power_law_1.2,1.192140769958496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,16,power_law_1.2,0.18165760040283202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,16,power_law_1.2,0.35389440059661864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,16,power_law_1.2,0.3325952053070068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,16,power_law_1.2,0.36720640659332277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,16,power_law_1.2,0.35942399501800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,16,power_law_1.2,0.22200319766998292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,16,power_law_1.2,0.31026558876037597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,16,power_law_1.2,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,16,power_law_1.2,0.32133119106292723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,16,power_law_1.2,0.33566720485687257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,16,power_law_1.2,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,16,power_law_1.2,0.34099199771881106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,16,power_law_1.2,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,16,power_law_1.2,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,16,power_law_1.2,0.3338239908218384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,16,power_law_1.2,0.3241791963577271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,16,power_law_1.2,0.3733504056930542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,16,power_law_1.2,0.3987071990966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,16,power_law_1.2,0.4077439785003662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,16,power_law_1.2,0.46448640823364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,16,power_law_1.2,0.5398528099060058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,16,power_law_1.2,0.6561791896820068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,16,power_law_1.2,0.8015872001647949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,16,power_law_1.2,1.1378687858581542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,16,power_law_1.2,1.620172882080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,16,power_law_1.2,2.203443145751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,4,power_law_1.2,1.8132991790771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,16,power_law_1.2,2.5505792617797853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,2,balanced,0.6009173393249512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,2,balanced,1.0357759793599446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,2,balanced,2.042880058288574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,2,balanced,4.116138776143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,2,balanced,7.987541198730469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,2,balanced,15.919787089029947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,2,balanced,23.87609608968099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,2,balanced,23.896746317545574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,2,balanced,23.895894368489582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,4,power_law_1.2,2.447564888000488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,2,balanced,23.913302103678387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,2,balanced,23.94129180908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,2,balanced,23.979685465494793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,2,balanced,24.009557088216145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,2,balanced,24.068267822265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,2,balanced,24.13072967529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,2,balanced,24.186538696289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,2,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,2,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,2,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,2,balanced,0.13958932956059775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,2,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,2,balanced,0.6768639882405599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,2,balanced,0.6816426912943522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,2,balanced,0.67413330078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,2,balanced,0.6789120038350424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,2,balanced,0.6801066398620605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,2,balanced,24.297813415527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,2,balanced,0.6855680147806803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,2,balanced,0.6934186617533366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,2,balanced,0.6976853211720785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,2,balanced,0.7089493274688721
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,2,balanced,0.7179946899414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,2,balanced,0.7287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,2,balanced,0.7464959621429443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,2,balanced,0.7833600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,2,balanced,0.8273920218149821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,2,balanced,24.5567143758138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,2,balanced,0.9091413021087646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,2,balanced,0.9902079900105795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,2,balanced,1.160533348719279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,2,balanced,1.3595306078592937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,2,balanced,1.7397759755452473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,2,balanced,2.1022720336914062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,2,balanced,2.8777812321980796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,2,balanced,25.46056620279948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,2,balanced,3.797674814860026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,2,balanced,25.906005859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,2,balanced,26.58440653483073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,2,balanced,27.327316284179688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,64,power_law_1.2,0.2486272096633911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,64,power_law_1.2,0.2258944034576416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,64,power_law_1.2,0.22691841125488282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,64,power_law_1.2,0.22669439315795897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,64,power_law_1.2,0.1826688051223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,64,power_law_1.2,0.1087488055229187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,64,power_law_1.2,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,64,power_law_1.2,0.2066431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,64,power_law_1.2,0.1271615982055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,64,power_law_1.2,0.17285120487213135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,2,balanced,30.65753682454427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,64,power_law_1.2,0.21790719032287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,64,power_law_1.2,0.2209791898727417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,64,power_law_1.2,0.19230719804763793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,64,power_law_1.2,0.19517439603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,64,power_law_1.2,0.20889599323272706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,64,power_law_1.2,0.22282240390777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,64,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,64,power_law_1.2,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,64,power_law_1.2,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,64,power_law_1.2,0.38461439609527587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,64,power_law_1.2,0.4423679828643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,64,power_law_1.2,0.5414912223815918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,64,power_law_1.2,0.7303167819976807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,64,power_law_1.2,1.0264575958251954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,64,power_law_1.2,1.5577088356018067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,64,power_law_1.2,2.2738943099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,2,balanced,43.260050455729164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,64,power_law_1.2,3.101491165161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,2,balanced,33.49725850423177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,2,balanced,42.72315979003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,2,balanced,39.477760314941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,4,power_law_1.2,0.2559999942779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,4,power_law_1.2,0.26869759559631345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,4,power_law_1.2,0.372326397895813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,4,power_law_1.2,0.5040128231048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,4,power_law_1.2,0.6516736030578614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,4,power_law_1.2,0.780083179473877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,4,power_law_1.2,0.8630271911621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,4,power_law_1.2,0.8316927909851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,4,power_law_1.2,0.8275967597961426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,4,power_law_1.2,0.8656703948974609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,4,power_law_1.2,0.8597503662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,4,power_law_1.2,0.9103360176086426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,4,power_law_1.2,0.8716287612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,4,power_law_1.2,0.8998911857604981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,4,power_law_1.2,0.9215999603271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,4,power_law_1.2,0.9523200035095215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,4,power_law_1.2,0.9953280448913574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,4,power_law_1.2,1.0581888198852538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,4,power_law_1.2,1.124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,4,power_law_1.2,1.308672046661377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,4,power_law_1.2,1.5011839866638184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,4,power_law_1.2,1.9394559860229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,4,power_law_1.2,2.2112064361572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,4,power_law_1.2,3.28089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,4,power_law_1.2,4.09436149597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,16,power_law_1.01,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,16,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,16,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,16,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,16,power_law_1.01,0.034995201230049136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,16,power_law_1.01,0.03500800132751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,16,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,16,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,16,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,16,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,16,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,16,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,16,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,16,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,16,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,16,power_law_1.01,0.06448000073432922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,16,power_law_1.01,0.07680000066757202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,16,power_law_1.01,0.1099776029586792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,16,power_law_1.01,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,16,power_law_1.01,0.32133119106292723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,16,power_law_1.01,0.50032639503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,16,power_law_1.01,0.6563839912414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,16,power_law_1.01,1.1718655586242677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,16,power_law_1.01,1.6228351593017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,4,power_law_1.2,5.698764801025391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,8,power_law_1.01,1.1356160163879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,8,power_law_1.01,1.981439971923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,8,power_law_1.01,1.8065408706665038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,8,power_law_1.01,2.0342784881591798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,8,power_law_1.01,1.6316415786743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,8,power_law_1.01,2.5620479583740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,8,power_law_1.01,2.328780746459961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,8,power_law_1.01,2.5028608322143553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,8,power_law_1.01,2.4610815048217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,8,power_law_1.01,2.4938495635986326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,8,power_law_1.01,2.594803237915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,8,power_law_1.01,2.6441728591918947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,8,power_law_1.01,2.7183103561401367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,8,power_law_1.01,2.7811840057373045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,8,power_law_1.01,2.8010496139526366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,8,power_law_1.01,2.9593599319458006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,8,power_law_1.01,3.238092803955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,8,power_law_1.01,3.2935871124267577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,8,power_law_1.01,3.4342910766601564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,8,power_law_1.01,3.9028736114501954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,8,power_law_1.01,4.89799690246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,8,power_law_1.01,5.687705612182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,8,power_law_1.01,5.600255966186523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,4,power_law_1.2,7.463731384277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,8,power_law_1.01,7.108608245849609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,8,power_law_1.01,9.513369750976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,8,power_law_1.01,12.101427459716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,8,power_law_1.01,15.461581420898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,16,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,16,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,16,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,16,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,16,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,16,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,16,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,16,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,16,power_law_1.2,0.039705601334571836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,16,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,16,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,16,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,16,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,16,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,16,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,16,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,16,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,16,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,16,power_law_1.2,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,16,power_law_1.2,0.09256960153579712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,16,power_law_1.2,0.1134335994720459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,16,power_law_1.2,0.18063360452651978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,16,power_law_1.2,0.28241920471191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,16,power_law_1.2,0.42311677932739256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,16,power_law_1.2,0.5306367874145508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,16,power_law_1.2,0.8994624137878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,16,power_law_1.2,1.3780991554260253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,2,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,2,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,2,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,2,power_law_1.2,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,2,power_law_1.2,0.10567679405212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,2,power_law_1.2,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,2,power_law_1.2,0.24778881072998046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,2,power_law_1.2,0.32276480197906493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,2,power_law_1.2,0.33381760120391846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,2,power_law_1.2,0.3358720064163208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,2,power_law_1.2,0.34406399726867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,2,power_law_1.2,0.3866624116897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,2,power_law_1.2,0.38645761013031005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,2,power_law_1.2,0.41594882011413575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,2,power_law_1.2,0.42841601371765137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,2,power_law_1.2,0.44503040313720704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,2,power_law_1.2,0.4894720077514648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,2,power_law_1.2,0.5777408123016358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,2,power_law_1.2,0.6438911914825439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,2,power_law_1.2,0.861184024810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,2,power_law_1.2,1.082572841644287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,2,power_law_1.2,1.4780415534973144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,2,power_law_1.2,1.9339071273803712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,2,power_law_1.2,2.7488256454467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,2,power_law_1.2,3.6747264862060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,2,power_law_1.2,5.625651168823242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,2,power_law_1.2,7.4635261535644535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,2,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,2,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,2,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,2,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,2,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,2,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,2,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,2,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,2,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,2,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,2,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,2,power_law_1.2,0.03480319976806641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,2,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,2,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,2,power_law_1.2,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,2,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,2,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,2,power_law_1.2,0.07782400250434876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,2,power_law_1.2,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,2,power_law_1.2,0.11919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,2,power_law_1.2,0.19865599870681763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,1,balanced,0.2725546757380168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,1,balanced,0.45585068066914874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,1,balanced,0.8907093207041422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,1,balanced,0.8796160221099854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,1,balanced,0.882858673731486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,1,balanced,0.891050656636556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,1,balanced,0.8948053518931071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,1,balanced,0.9014613628387451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,1,balanced,0.9057280222574869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,1,balanced,0.9127253691355387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,2,power_law_1.2,0.3180543899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,1,balanced,0.9222826957702637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,1,balanced,0.9320106506347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,1,balanced,0.9434453646341959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,1,balanced,0.9823573430379232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,1,balanced,1.0112000306447346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,1,balanced,1.0316800276438396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,1,balanced,1.0395306746164958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,1,balanced,1.1279359658559163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,1,balanced,1.2675413290659587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,1,balanced,1.5769599278767903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,1,balanced,1.9430400530497234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,1,balanced,2.9032106399536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,1,balanced,3.806549390157064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,1,balanced,5.575679779052734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,1,balanced,7.265109380086263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,1,balanced,10.755925496419271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,1,balanced,14.394879659016928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,2,power_law_1.2,0.40529918670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,2,power_law_1.2,0.6201344013214112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,1,power_law_1.2,0.09971839785575867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,1,power_law_1.2,0.22586240768432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,1,power_law_1.2,0.28935039043426514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,1,power_law_1.2,0.5080895900726319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,1,power_law_1.2,0.5249023914337159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,1,power_law_1.2,0.5298175811767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,1,power_law_1.2,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,1,power_law_1.2,0.5353280067443847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,1,power_law_1.2,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,1,power_law_1.2,0.5470208168029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,1,power_law_1.2,0.552953577041626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,1,power_law_1.2,0.5584896087646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,1,power_law_1.2,0.5681151866912841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,1,power_law_1.2,0.5756927967071533
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,1,power_law_1.2,0.597811222076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,1,power_law_1.2,0.6151999950408935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,1,power_law_1.2,0.6873087882995605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,1,power_law_1.2,0.794214391708374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,1,power_law_1.2,0.8673279762268067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,1,power_law_1.2,1.1661312103271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,1,power_law_1.2,1.4106431961059571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,2,power_law_1.2,0.923033618927002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,1,power_law_1.2,2.0346879959106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,1,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,1,power_law_1.01,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,1,power_law_1.01,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,1,power_law_1.01,0.35653760433197024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,1,power_law_1.01,0.4497407913208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,1,power_law_1.01,0.7208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,1,power_law_1.01,0.7831552028656006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,1,power_law_1.01,0.7962624073028565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,1,power_law_1.01,0.8322943687438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,1,power_law_1.01,0.8472576141357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,1,power_law_1.2,2.532966423034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,1,power_law_1.01,0.8626175880432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,1,power_law_1.01,0.8749055862426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,1,power_law_1.01,0.8816320419311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,1,power_law_1.01,0.915231990814209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,1,power_law_1.01,0.9338687896728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,1,power_law_1.01,0.9494272232055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,1,power_law_1.01,0.9803775787353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,1,power_law_1.01,1.0479616165161132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,1,power_law_1.01,1.1149312019348145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,1,power_law_1.01,1.2383999824523926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,1,power_law_1.01,1.3903807640075683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,1,power_law_1.01,1.7295360565185547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,1,power_law_1.01,2.0701183319091796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,1,power_law_1.01,2.777292823791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,1,power_law_1.01,3.308544158935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,1,power_law_1.01,4.645068740844726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,1,power_law_1.01,5.889843368530274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,1,power_law_1.2,3.729395294189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,2,power_law_1.2,1.581670379638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,8,power_law_1.01,0.021689599752426146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,8,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,8,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,8,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,8,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,8,power_law_1.01,0.024780799448490144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,8,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,8,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,8,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,8,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,8,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,8,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,8,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,8,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,8,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,8,power_law_1.01,0.05569919943809509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,8,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,8,power_law_1.01,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,8,power_law_1.01,0.10321919918060303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,8,power_law_1.01,0.13271039724349976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,8,power_law_1.01,0.186572802066803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,8,power_law_1.01,0.32829439640045166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,8,power_law_1.01,0.47513599395751954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,8,power_law_1.01,0.7817215919494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,8,power_law_1.01,1.0891263961791993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,4,power_law_1.01,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,4,power_law_1.01,0.5509119987487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,1,power_law_1.2,4.810547256469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,4,power_law_1.01,1.0565631866455079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,4,power_law_1.01,1.0166272163391112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,4,power_law_1.01,1.4395392417907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,4,power_law_1.01,1.5605759620666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,4,power_law_1.01,1.9769344329833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,4,power_law_1.01,2.4414207458496096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,4,power_law_1.01,2.2149120330810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,4,power_law_1.01,2.411315155029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,4,power_law_1.01,2.369107246398926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,4,power_law_1.01,2.4999935150146486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,4,power_law_1.01,2.5739263534545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,4,power_law_1.01,2.5991167068481444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,4,power_law_1.01,2.789369583129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,4,power_law_1.01,2.787731170654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,4,power_law_1.01,2.6910720825195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,4,power_law_1.01,2.914918327331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,4,power_law_1.01,3.1733760833740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,4,power_law_1.01,3.2176128387451173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,4,power_law_1.01,3.5088382720947267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,4,power_law_1.01,3.808256149291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,4,power_law_1.01,4.17259521484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,2,power_law_1.01,1.0788864135742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,4,power_law_1.01,5.142937469482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,2,power_law_1.01,2.044108772277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,2,power_law_1.01,3.9979007720947264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,4,power_law_1.01,6.3364990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,2,power_law_1.01,5.601260757446289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,4,power_law_1.01,8.200806427001954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,2,power_law_1.01,9.119334411621093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,4,power_law_1.01,9.740493011474609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,2,power_law_1.01,11.475762939453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,1,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,1,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,1,balanced,0.24678399165471396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,1,balanced,0.2469546596209208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,1,balanced,0.24593067169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,1,balanced,0.24729599555333456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,1,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,1,balanced,0.25887467463811237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,1,balanced,0.26077866554260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,1,balanced,0.26316799720128375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,1,balanced,0.265557328859965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,1,balanced,0.27115732431411743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,1,balanced,0.27511467536290485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,1,balanced,0.2739199995994568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,1,balanced,0.2829599976539612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,1,balanced,0.2913279930750529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,1,balanced,0.3211946686108907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,1,balanced,0.36025599638621014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,1,balanced,0.3921866814295451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,1,balanced,0.4604586760203044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,1,balanced,0.5845226844151815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,2,power_law_1.01,13.148570251464843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,1,balanced,0.8872959613800049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,1,balanced,1.2113920052846272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,1,balanced,1.8843305905659993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,1,balanced,2.592426617940267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,1,balanced,4.035925229390462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,1,balanced,5.4348799387613935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,2,power_law_1.01,17.086668395996092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,2,power_law_1.01,17.172274780273437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,2,power_law_1.01,18.422169494628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,2,power_law_1.01,19.1393798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,2,power_law_1.01,19.27843780517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,2,power_law_1.01,19.144499206542967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,2,power_law_1.01,19.563308715820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,1,power_law_1.2,6.847283172607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,2,power_law_1.01,19.482418823242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,2,power_law_1.2,1.8587648391723632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,2,power_law_1.01,20.604518127441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,2,power_law_1.01,21.042752075195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,2,power_law_1.01,22.553190612792967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,2,power_law_1.01,23.8413818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,2,power_law_1.01,25.01099548339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,256,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,256,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,256,balanced,0.039077334105968475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,256,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,256,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,256,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,256,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,256,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,256,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,256,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,256,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,256,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,256,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,256,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,256,balanced,0.04691733419895172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,256,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,256,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,256,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,256,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,256,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,256,balanced,0.0721919983625412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,256,balanced,0.08772266904513042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,256,balanced,0.10496000448862712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,256,balanced,0.16264533003171286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,256,balanced,0.19114667177200317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,256,balanced,0.34884266058603924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,256,balanced,0.44509867827097577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,2,power_law_1.01,26.527130126953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,2,power_law_1.01,28.476824951171874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,2,power_law_1.01,30.839398193359376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,1,power_law_1.2,8.895487976074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,2,power_law_1.01,38.10508728027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,2,power_law_1.01,35.970663452148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,2,power_law_1.01,44.288818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,2,power_law_1.01,50.977996826171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,2,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,2,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,2,power_law_1.01,0.1112064003944397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,2,power_law_1.01,0.2072511911392212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,2,power_law_1.01,0.31395840644836426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,2,power_law_1.01,0.3803136110305786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,2,power_law_1.01,0.4276224136352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,2,power_law_1.01,0.4337471961975098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,2,power_law_1.01,0.4415487766265869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,2,power_law_1.01,0.44994559288024905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,2,power_law_1.01,0.44851198196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,2,power_law_1.01,0.46981120109558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,2,power_law_1.01,0.47656960487365724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,2,power_law_1.01,0.491315221786499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,2,power_law_1.01,0.5029888153076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,2,power_law_1.01,0.5081088066101074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,2,power_law_1.01,0.5345280170440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,2,power_law_1.01,0.5945343971252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,2,power_law_1.01,0.6424575805664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,2,power_law_1.01,0.765331220626831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,2,power_law_1.01,0.9109503746032714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,2,power_law_1.01,1.177190399169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,2,power_law_1.01,1.4608384132385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,2,power_law_1.01,1.9574783325195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,2,power_law_1.01,2.5186304092407226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,2,power_law_1.01,3.691519927978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,2,power_law_1.01,4.789043045043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,32,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,32,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,32,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,32,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,32,balanced,0.0653546651204427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,32,balanced,0.21504000822703043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,32,balanced,0.21606399615605673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,32,balanced,0.21657600005467734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,32,balanced,0.21760000785191855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,32,balanced,0.21862399578094482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,32,balanced,0.22118399540583292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,32,balanced,0.2228906750679016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,32,balanced,0.2259626587231954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,32,balanced,0.2295466661453247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,32,balanced,0.2326186696688334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,32,balanced,0.23910399278004965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,32,balanced,0.250709335009257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,32,balanced,0.2717013359069824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,32,balanced,0.29576534032821655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,32,balanced,0.31726932525634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,32,balanced,0.3677866856257121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,32,balanced,0.4672853151957194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,2,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,32,balanced,0.5824853181838989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,2,power_law_1.01,0.19230719804763793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,32,balanced,0.7284053166707357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,2,power_law_1.01,0.2869247913360596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,2,power_law_1.01,0.45281281471252444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,32,balanced,1.0513066450754802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,2,power_law_1.01,0.6098944187164307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,32,balanced,1.3928106625874836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,2,power_law_1.01,0.7430143833160401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,16,power_law_1.2,0.5879807949066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,16,power_law_1.2,0.6342656135559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,2,power_law_1.01,1.0434559822082519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,16,power_law_1.2,0.6592512130737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,2,power_law_1.01,1.064345645904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,16,power_law_1.2,0.7284736156463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,2,power_law_1.01,1.0598400115966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,16,power_law_1.2,0.5742591857910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,16,power_law_1.2,0.6066175937652588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,2,power_law_1.01,1.0858495712280274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,16,power_law_1.2,0.6782976150512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,2,power_law_1.01,1.1042816162109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,16,power_law_1.2,0.6938623905181884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,16,power_law_1.2,0.7110655784606934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,2,power_law_1.01,1.1220992088317872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,16,power_law_1.2,0.6631423950195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,2,power_law_1.01,1.1790335655212403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,16,power_law_1.2,0.7221248149871826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,2,power_law_1.01,1.217740821838379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,16,power_law_1.2,0.7176064014434814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,16,power_law_1.2,0.7213056087493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,2,power_law_1.01,1.2519424438476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,16,power_law_1.2,0.7475200176239014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,2,power_law_1.01,1.268735980987549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,16,power_law_1.2,0.7643136024475098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,2,power_law_1.01,1.2902400016784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,16,power_law_1.2,0.7671807765960693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,16,power_law_1.2,0.8275967597961426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,2,power_law_1.01,1.4163968086242675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,16,power_law_1.2,0.9226240158081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,2,power_law_1.01,1.3905920028686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,16,power_law_1.2,0.9783231735229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,2,power_law_1.01,1.5220735549926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,16,power_law_1.2,1.1653120040893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,2,power_law_1.01,1.6666624069213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,16,power_law_1.2,1.4462976455688477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,2,power_law_1.01,1.9521535873413085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,16,power_law_1.2,2.0121599197387696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,2,power_law_1.01,2.226585578918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,16,power_law_1.2,2.082406425476074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,2,power_law_1.01,2.9085695266723635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,16,power_law_1.2,3.2217086791992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,2,power_law_1.01,3.2716800689697267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,2,power_law_1.01,4.569292831420898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,2,power_law_1.01,5.8333183288574215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,16,power_law_1.2,4.629504013061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,16,power_law_1.2,6.141952133178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,1,power_law_1.2,0.0446399986743927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,1,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,1,power_law_1.2,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,1,power_law_1.2,0.31989760398864747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,1,power_law_1.2,0.46100478172302245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,1,power_law_1.2,0.6287295818328857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,1,power_law_1.2,0.952729606628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,1,power_law_1.2,1.0203136444091796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,1,power_law_1.2,1.0264575958251954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,1,power_law_1.2,1.0631168365478516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,1,power_law_1.2,1.1171839714050293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,1,power_law_1.2,1.1515904426574708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,1,power_law_1.2,1.1745280265808105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,1,power_law_1.2,1.2388031959533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,1,power_law_1.2,1.2933119773864745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,1,power_law_1.2,1.3064191818237305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,1,power_law_1.2,1.379532814025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,2,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,2,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,2,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,2,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,1,power_law_1.2,1.4858240127563476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,2,balanced,0.2321066657702128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,2,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,2,balanced,0.23654399315516153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,2,balanced,0.23825067281723022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,2,balanced,0.23910399278004965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,2,balanced,0.2404693365097046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,1,power_law_1.2,1.59170560836792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,2,balanced,0.2379093368848165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,2,balanced,0.24132267634073892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,2,balanced,0.242682675520579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,2,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,2,balanced,0.2558293342590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,2,balanced,0.25975465774536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,2,balanced,0.26794666051864624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,1,power_law_1.2,1.785036849975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,2,balanced,0.27989333868026733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,2,balanced,0.3007146716117859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,2,balanced,0.3285333315531413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,2,balanced,0.3643733263015747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,2,balanced,0.47086934248606366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,1,power_law_1.2,1.9508928298950194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,2,balanced,0.6184959808985392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,2,balanced,0.93559463818868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,2,balanced,1.226581335067749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,1,power_law_1.2,2.3922496795654298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,2,balanced,1.8565120697021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,16,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,16,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,16,balanced,0.06229333579540253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,16,balanced,0.3136853377024333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,1,power_law_1.2,2.8010496139526366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,16,balanced,0.37905065218607586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,16,balanced,0.3809279998143514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,2,balanced,2.477205276489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,16,balanced,0.3829760154088338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,16,balanced,0.38417065143585205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,16,balanced,0.3860479990641276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,16,balanced,0.38860801855723065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,16,balanced,0.3915040095647176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,16,balanced,0.39458131790161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,1,power_law_1.2,3.6992961883544924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,16,balanced,0.3998719851175944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,16,balanced,0.4072106679280599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,16,balanced,0.41386667887369794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,16,balanced,0.423253337542216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,16,balanced,0.4456106821695964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,16,balanced,0.47257598241170246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,16,balanced,0.5159253279368082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,16,balanced,0.5478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,1,power_law_1.2,4.469555282592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,16,balanced,0.6140586535135905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,16,balanced,0.7085973421732584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,16,balanced,0.9456640084584554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,16,balanced,1.182207981745402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,1,power_law_1.2,6.3041534423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,16,balanced,1.7783466974894206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,16,balanced,2.356394608815511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,8,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,8,power_law_1.01,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,1,power_law_1.2,7.947468566894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,8,power_law_1.01,0.04607360064983368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,8,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,8,power_law_1.01,0.0595583975315094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,8,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,8,power_law_1.01,0.08048639893531799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,8,power_law_1.01,0.08455680012702942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,8,power_law_1.01,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,8,power_law_1.01,0.10280959606170655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,8,power_law_1.01,0.1325055956840515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,8,power_law_1.01,0.17141760587692262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,8,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,8,power_law_1.01,0.2846719980239868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,8,power_law_1.01,0.43128318786621095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,8,power_law_1.01,0.4982783794403076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,8,power_law_1.01,0.8435392379760742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,8,power_law_1.01,1.0137599945068358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,16,power_law_1.2,8.52459487915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,8,power_law_1.01,1.5437824249267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,8,power_law_1.01,1.9134464263916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,8,power_law_1.01,3.034111976623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,8,power_law_1.01,4.126924896240235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,8,power_law_1.01,6.155059051513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,8,power_law_1.01,8.36157455444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,1,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,1,balanced,0.06092800199985504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,1,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,1,balanced,0.08618666728337605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,1,balanced,0.29661866029103595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,1,balanced,0.5536426703135172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,1,balanced,0.8009066581726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,1,balanced,0.8093012968699137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,1,balanced,0.8202239672342936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,1,balanced,0.8272213141123453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,1,balanced,0.8422400156656901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,1,balanced,0.8618666330973307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,1,balanced,0.8782347043355306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,1,balanced,0.9122133255004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,1,balanced,0.9468533198038737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,1,balanced,0.9777493476867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,1,balanced,1.05403733253479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,1,balanced,1.1929600238800049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,1,balanced,1.3615786234537761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,1,balanced,1.7058134078979492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,1,balanced,2.046293258666992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,1,balanced,2.719914754231771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,1,balanced,3.358037312825521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,1,balanced,4.789930661519368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,1,balanced,6.296576182047526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,1,balanced,9.397759755452475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,1,balanced,12.283220926920572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,4,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,4,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,4,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,4,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,4,power_law_1.01,0.052832001447677614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,4,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,4,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,4,power_law_1.01,0.08048639893531799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,4,power_law_1.01,0.13434879779815673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,4,power_law_1.01,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,4,power_law_1.01,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,4,power_law_1.01,0.14335999488830567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,4,power_law_1.01,0.11939840316772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,4,power_law_1.01,0.14929920434951782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,4,power_law_1.01,0.1820672035217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,4,power_law_1.01,0.17674239873886108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,4,power_law_1.01,0.2070528030395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,4,power_law_1.01,0.22446079254150392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,4,power_law_1.01,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,4,power_law_1.01,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,4,power_law_1.01,0.341593599319458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,4,power_law_1.01,0.4177919864654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,4,power_law_1.01,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,4,power_law_1.01,0.8861696243286132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,4,power_law_1.01,1.1718655586242677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,4,power_law_1.01,1.8360319137573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,4,power_law_1.01,2.4252416610717775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,8,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,8,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,8,balanced,0.2696533401807149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,8,balanced,0.47786664962768555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,8,balanced,0.8023040294647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,8,balanced,1.0615466435750325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,8,balanced,1.053173303604126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,8,balanced,1.0574506918589275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,8,balanced,1.0605226357777913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,8,balanced,1.06496000289917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,8,balanced,1.07042129834493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,8,balanced,1.0781013170878093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,8,balanced,1.0842453638712566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,8,balanced,1.104042689005534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,8,balanced,1.1112106641133626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,8,balanced,1.1224746704101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,8,balanced,1.145855983098348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,8,balanced,1.2006399631500244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,8,balanced,1.2453546524047852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,8,balanced,1.3269333044687908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,8,balanced,1.4079999923706055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,8,balanced,1.610581398010254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,8,balanced,1.8029227256774902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,8,balanced,2.3053654034932456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,8,balanced,2.8035411834716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,8,balanced,3.795114517211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,8,balanced,4.8820905685424805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,4,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,4,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,4,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,4,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,4,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,4,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,4,power_law_1.01,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,4,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,4,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,4,power_law_1.01,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,4,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,4,power_law_1.01,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,4,power_law_1.01,0.09789440035820007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,4,power_law_1.01,0.13332480192184448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,4,power_law_1.01,0.1652735948562622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,4,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,4,power_law_1.01,0.2605056047439575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,4,power_law_1.01,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,4,power_law_1.01,0.38830080032348635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,4,power_law_1.01,0.528384017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,4,power_law_1.01,0.8087552070617676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,4,power_law_1.01,1.0688511848449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,4,power_law_1.01,1.6293760299682618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,32,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,4,power_law_1.01,2.1985279083251954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,32,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,32,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,32,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,32,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,32,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,32,balanced,0.02881066749493281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,32,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,32,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,32,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,32,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,32,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,32,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,32,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,32,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,64,balanced,0.057317331433296204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,32,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,64,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,32,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,64,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,32,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,64,balanced,0.05134933193524679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,4,power_law_1.01,3.4502655029296876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,64,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,32,balanced,0.09112000465393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,32,balanced,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,32,balanced,0.12336533268292744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,32,balanced,0.1628159979979197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,32,balanced,0.28962133328119916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,32,balanced,0.3527573347091675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,4,power_law_1.01,4.552089691162109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,64,balanced,0.28569600979487103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,64,balanced,0.28757333755493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,64,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,64,balanced,0.2908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,64,balanced,0.28996266921361286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,64,balanced,0.2918399969736735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,64,balanced,0.29286400477091473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,64,balanced,0.29474133253097534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,64,balanced,0.29730133215586346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,64,balanced,0.3020640015602112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,64,balanced,0.30427734057108563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,64,balanced,0.31163734197616577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,64,balanced,0.3259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,64,balanced,0.3391146659851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,64,balanced,0.3614720106124878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,64,balanced,0.3868853251139323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,64,balanced,0.4246186812718709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,64,balanced,0.4896426598230998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,64,balanced,0.5980159838994344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,64,balanced,0.7034613291422526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,64,balanced,0.9168213208516439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,64,balanced,1.1864746411641438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,4,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,4,power_law_1.01,0.19456000328063966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,4,power_law_1.01,0.2570240020751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,4,power_law_1.01,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,4,power_law_1.01,0.3950592041015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,4,power_law_1.01,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,4,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,4,power_law_1.01,0.5392384052276611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,4,power_law_1.01,0.6031360149383544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,4,power_law_1.01,0.591648006439209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,4,power_law_1.01,0.5922815799713135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,4,power_law_1.01,0.6107135772705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,4,power_law_1.01,0.6160384178161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,4,power_law_1.01,0.6062079906463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,4,power_law_1.01,0.6338560104370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,4,power_law_1.01,0.6223872184753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,4,power_law_1.01,0.6414336204528809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,4,power_law_1.01,0.7077695846557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,4,power_law_1.01,0.7434239864349366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,4,power_law_1.01,0.8153087615966796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,4,power_law_1.01,0.8683520317077636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,4,power_law_1.01,1.0094464302062989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,4,power_law_1.01,1.207692813873291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,4,power_law_1.01,1.6150527954101563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,4,power_law_1.01,2.005401611328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,4,power_law_1.01,2.757427215576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,4,power_law_1.01,3.4086910247802735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,4,power_law_1.2,0.3477504014968872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,4,power_law_1.2,0.36474881172180174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,4,power_law_1.2,0.5720064163208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,4,power_law_1.2,0.7292928218841552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,4,power_law_1.2,0.7346176147460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,4,power_law_1.2,1.2646400451660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,4,power_law_1.2,1.225932788848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,4,power_law_1.2,1.2171263694763184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,4,power_law_1.2,1.204428768157959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,4,power_law_1.2,1.2195839881896973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,4,power_law_1.2,1.3305855751037599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,4,power_law_1.2,1.3658111572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,4,power_law_1.2,1.3758463859558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,4,power_law_1.2,1.3881343841552733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,4,power_law_1.2,1.4202879905700683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,4,power_law_1.2,1.47128324508667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,4,power_law_1.2,1.5128576278686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,4,power_law_1.2,1.5857600212097167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,4,power_law_1.2,1.6207872390747071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,4,power_law_1.2,1.9208192825317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,4,power_law_1.2,2.071334457397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,4,power_law_1.2,2.7066368103027343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,4,power_law_1.2,3.380633544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,4,power_law_1.2,4.244070434570313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,4,power_law_1.2,5.447257614135742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,4,power_law_1.2,7.533567810058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,64,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,64,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,64,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,64,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,64,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,64,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,64,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,64,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,64,power_law_1.2,0.0566976010799408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,64,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,64,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,64,power_law_1.2,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,64,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,64,power_law_1.2,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,64,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,64,power_law_1.2,0.08540160059928895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,64,power_law_1.2,0.10076160430908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,64,power_law_1.2,0.17428480386734008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,64,power_law_1.2,0.21155838966369628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,4,power_law_1.2,9.694822692871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,64,power_law_1.2,0.2869247913360596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,4,power_law_1.2,0.5091328144073486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,64,power_law_1.2,0.3309312105178833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,4,power_law_1.2,0.7186431884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,4,power_law_1.2,0.5472256183624268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,64,power_law_1.2,0.45137920379638674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,4,power_law_1.2,0.9383935928344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,64,power_law_1.2,0.6002687931060791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,4,power_law_1.2,0.812831974029541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,4,power_law_1.2,0.9056256294250489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,4,power_law_1.2,0.913203239440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,64,power_law_1.2,1.1345919609069823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,4,power_law_1.2,0.9164799690246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,4,power_law_1.2,1.2083200454711913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,4,power_law_1.2,1.1405183792114257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,64,power_law_1.2,1.3529088020324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,4,power_law_1.2,1.3103103637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,4,power_law_1.2,1.3651968002319337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,4,power_law_1.2,1.6246784210205079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,4,power_law_1.2,1.4278656005859376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,4,power_law_1.2,1.794041633605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,4,power_law_1.2,1.8698240280151368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,256,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,256,power_law_1.01,0.03868800103664398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,256,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,4,power_law_1.2,2.2681600570678713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,256,power_law_1.01,0.03889279961585999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,256,power_law_1.01,0.039078399538993835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,256,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,256,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,256,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,4,power_law_1.2,3.2266239166259765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,256,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,256,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,256,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,256,power_law_1.01,0.04668160080909729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,256,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,256,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,256,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,256,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,256,power_law_1.01,0.057126402854919434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,256,power_law_1.01,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,256,power_law_1.01,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,256,power_law_1.01,0.11694079637527466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,256,power_law_1.01,0.1619647979736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,4,power_law_1.2,3.865804672241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,256,power_law_1.01,0.24801280498504638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,256,power_law_1.01,0.3231744050979614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,256,power_law_1.01,0.47472639083862306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,64,power_law_1.2,2.1776384353637694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,256,power_law_1.01,0.7086080074310303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,256,power_law_1.01,1.1190272331237794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,256,power_law_1.01,1.4573439598083495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,64,power_law_1.2,2.7883520126342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,4,power_law_1.2,5.0089984893798825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,4,power_law_1.2,6.2545921325683596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,8,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,8,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,8,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,8,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,8,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,8,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,8,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,8,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,8,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,8,balanced,0.03120533376932144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,8,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,8,balanced,0.0329066663980484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,8,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,8,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,8,balanced,0.05287999908129374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,8,balanced,0.06910400092601776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,8,balanced,0.08120533327261607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,4,power_law_1.2,7.996415710449218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,8,balanced,0.21094399690628052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,8,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,8,balanced,0.4358826478322347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,8,balanced,0.5898240009943644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,8,balanced,0.9050453503926595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,8,balanced,1.239194631576538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,4,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,4,power_law_1.2,10.443366241455077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,4,power_law_1.01,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,4,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,4,power_law_1.01,0.11489280462265014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,4,power_law_1.01,0.2289664030075073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,4,power_law_1.01,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,4,power_law_1.01,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,4,power_law_1.01,0.3506175994873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,4,power_law_1.01,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,4,power_law_1.01,0.3620863914489746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,4,power_law_1.01,0.3299328088760376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,4,power_law_1.01,0.3514240026473999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,4,power_law_1.01,0.3825664043426514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,4,power_law_1.01,0.38686718940734866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,4,power_law_1.01,0.3753983974456787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,4,power_law_1.01,0.39587841033935545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,16,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,16,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,4,power_law_1.01,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,16,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,16,power_law_1.01,0.03377920091152191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,4,power_law_1.01,0.4612095832824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,16,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,4,power_law_1.01,0.5238783836364747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,16,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,16,power_law_1.01,0.035411199927330016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,16,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,4,power_law_1.01,0.6625279903411865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,16,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,4,power_law_1.01,0.8089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,16,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,16,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,16,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,4,power_law_1.01,1.2247039794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,16,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,16,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,4,power_law_1.01,1.557913589477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,4,power_law_1.2,13.456179809570312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,16,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,16,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,16,power_law_1.01,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,16,power_law_1.01,0.12472319602966309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,4,power_law_1.01,2.1921791076660155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,16,power_law_1.01,0.18350080251693726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,16,power_law_1.01,0.21299200057983397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,16,power_law_1.01,0.30677759647369385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,16,power_law_1.01,0.44462080001831056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,16,power_law_1.01,0.7098368167877197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,16,power_law_1.01,1.0196864128112793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,4,power_law_1.01,2.6896383285522463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,16,power_law_1.01,1.5460351943969726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,16,power_law_1.01,2.2579200744628904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,4,power_law_1.01,4.059135818481446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,4,power_law_1.01,5.189427185058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,4,power_law_1.2,17.86429443359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,4,power_law_1.2,24.78612518310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,2,power_law_1.01,0.1146880030632019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,2,power_law_1.01,0.09134079813957215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,2,power_law_1.01,0.11059199571609497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,2,power_law_1.01,0.27031679153442384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,2,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,2,power_law_1.01,0.27934720516204836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,2,power_law_1.01,0.2689023971557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,2,power_law_1.01,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,2,power_law_1.01,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,2,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,2,power_law_1.01,0.30064640045166013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,2,power_law_1.01,0.3074048042297363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,2,power_law_1.01,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,2,power_law_1.01,0.3211071968078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,2,power_law_1.01,0.34651520252227785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,2,power_law_1.01,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,2,power_law_1.01,0.37294080257415774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,2,power_law_1.01,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,2,power_law_1.01,0.5386240005493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,2,power_law_1.01,0.6723584175109864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,2,power_law_1.01,0.8294400215148926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,2,power_law_1.01,1.3447168350219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,2,power_law_1.01,1.721343994140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,2,power_law_1.01,3.095756721496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,2,power_law_1.01,3.1934463500976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,4,power_law_1.2,29.552230834960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,8,power_law_1.2,1.1356160163879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,8,power_law_1.2,1.3684672355651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,8,power_law_1.2,1.862656021118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,8,power_law_1.2,2.246041679382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,8,power_law_1.2,1.924710464477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,8,power_law_1.2,2.348236846923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,8,power_law_1.2,2.5995264053344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,8,power_law_1.2,2.5556991577148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,8,power_law_1.2,2.642739105224609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,8,power_law_1.2,2.4735744476318358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,8,power_law_1.2,2.7111040115356446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,8,power_law_1.2,2.6611711502075197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,32,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,8,power_law_1.2,2.718924713134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,8,power_law_1.01,0.03888640105724335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,32,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,32,power_law_1.2,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,8,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,8,power_law_1.2,2.834227180480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,32,power_law_1.2,0.055289602279663085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,8,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,8,power_law_1.01,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,32,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,8,power_law_1.01,0.08806399703025818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,8,power_law_1.2,2.7627519607543944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,32,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,8,power_law_1.01,0.13803520202636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,32,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,8,power_law_1.01,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,8,power_law_1.2,2.9024255752563475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,8,power_law_1.01,0.08458240032196045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,32,power_law_1.2,0.05589759945869446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,8,power_law_1.2,3.1678464889526365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,8,power_law_1.01,0.1001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,32,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,8,power_law_1.01,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,2,power_law_1.01,5.008383941650391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,32,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,8,power_law_1.01,0.09953280091285706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,8,power_law_1.2,3.268403244018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,32,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,8,power_law_1.01,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,8,power_law_1.01,0.14950400590896606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,32,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,8,power_law_1.01,0.12799999713897706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,8,power_law_1.01,0.14172159433364867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,32,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,8,power_law_1.2,3.5788799285888673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,32,power_law_1.2,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,8,power_law_1.01,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,8,power_law_1.01,0.2007040023803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,32,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,8,power_law_1.2,4.0548095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,8,power_law_1.01,0.21585919857025146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,32,power_law_1.2,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,8,power_law_1.01,0.2447360038757324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,32,power_law_1.2,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,32,power_law_1.2,0.12083200216293336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,8,power_law_1.01,0.26128640174865725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,32,power_law_1.2,0.16855039596557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,8,power_law_1.01,0.3215359926223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,8,power_law_1.2,5.002841567993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,32,power_law_1.2,0.2668544054031372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,8,power_law_1.01,0.399564790725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,32,power_law_1.2,0.32027521133422854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,8,power_law_1.01,0.6289408206939697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,32,power_law_1.2,0.4403200149536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,8,power_law_1.01,0.7983104228973389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,32,power_law_1.2,0.6141952037811279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,8,power_law_1.2,7.2173309326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,8,power_law_1.01,1.3682687759399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,32,power_law_1.2,0.9529343605041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,32,power_law_1.2,1.1706368446350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,8,power_law_1.01,1.6320512771606446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,32,power_law_1.2,2.145894432067871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,8,power_law_1.2,6.367846298217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,32,power_law_1.2,3.0625791549682617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,8,power_law_1.2,9.109299468994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,8,power_law_1.2,9.837139129638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,1,power_law_1.01,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,1,power_law_1.01,0.5490687847137451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,1,power_law_1.01,1.0297344207763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,2,balanced,0.3017386595408122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,1,power_law_1.01,2.0215808868408205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,2,balanced,0.5258239905039469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,2,balanced,1.0287786324818928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,2,balanced,1.0335573355356853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,2,balanced,1.034069299697876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,1,power_law_1.01,3.134464073181152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,2,balanced,1.0403839747111003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,2,balanced,1.0533546606699626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,2,balanced,1.061205307642619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,2,balanced,1.0794666608174641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,8,power_law_1.2,14.48406982421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,2,balanced,1.0845866998036702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,1,power_law_1.01,4.01530876159668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,2,balanced,1.0919253031412761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,2,balanced,1.1030186812082927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,2,balanced,1.1105279922485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,2,balanced,1.1224746704101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,2,balanced,1.5052800178527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,2,balanced,1.5619413057963054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,1,power_law_1.01,5.693644714355469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,2,balanced,1.6861866315205891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,2,balanced,1.9795626004536946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,2,balanced,2.0512426694234214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,1,power_law_1.01,5.9443199157714846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,2,balanced,2.5966933568318686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,2,balanced,2.9337600072224936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,2,balanced,3.89357852935791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,1,power_law_1.01,6.24310417175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,2,balanced,4.883797327677409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,1,power_law_1.01,6.43583984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,2,balanced,6.570837020874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,1,power_law_1.01,6.678733062744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,2,balanced,8.189098358154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,1,power_law_1.01,6.793215942382813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,2,balanced,11.290964762369791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,1,power_law_1.01,6.980608367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,1,power_law_1.01,7.103078460693359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,2,balanced,14.556320190429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,1,power_law_1.01,7.2841026306152346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,8,power_law_1.2,19.643597412109376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,1,power_law_1.01,7.464755249023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,1,power_law_1.01,7.7228034973144535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,1,power_law_1.01,8.118271636962891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,1,power_law_1.01,8.461106872558593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,1,power_law_1.01,9.090252685546876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,1,power_law_1.01,9.869721221923829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,1,power_law_1.01,10.994073486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,1,power_law_1.01,11.684864044189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,2,power_law_1.01,7.255039978027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,1,power_law_1.01,14.346444702148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,1,power_law_1.01,16.831692504882813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,1,power_law_1.01,23.090176391601563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,1,power_law_1.01,27.729510498046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,4,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,4,power_law_1.01,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,4,power_law_1.01,0.324403190612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,4,power_law_1.01,0.39342079162597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,4,power_law_1.01,0.4472832202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,4,power_law_1.01,0.5951488018035889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,4,power_law_1.01,0.6518784046173096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,4,power_law_1.01,0.6178815841674805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,4,power_law_1.01,0.6692863941192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,4,power_law_1.01,0.6371327877044678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,4,power_law_1.01,0.6752255916595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,4,power_law_1.01,0.6823935985565186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,4,power_law_1.01,0.6891520023345947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,4,power_law_1.01,0.7057407855987549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,4,power_law_1.01,0.7423999786376954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,4,power_law_1.01,0.7489535808563232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,4,power_law_1.01,0.7817215919494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,4,power_law_1.01,0.8400896072387696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,4,power_law_1.01,0.8921088218688965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,4,power_law_1.01,1.0358783721923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,4,power_law_1.01,1.1077631950378417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,4,power_law_1.01,1.4639103889465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,4,power_law_1.01,1.7227775573730468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,4,power_law_1.01,2.458624076843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,4,power_law_1.01,2.913894462585449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,4,power_law_1.01,4.3866111755371096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,4,power_law_1.01,5.83372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,4,balanced,0.04264000058174133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,4,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,4,balanced,0.2402986685434977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,4,balanced,0.241647998491923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,4,balanced,0.24217599630355835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,4,balanced,0.24371200799942017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,4,balanced,0.2450773318608602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,4,balanced,0.24627200762430826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,4,balanced,0.2491733431816101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,4,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,4,balanced,0.25361067056655884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,4,balanced,0.25514666239420575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,4,balanced,0.2577066620190938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,4,balanced,0.2734079957008362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,4,balanced,0.27134400606155396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,4,balanced,0.2768213351567586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,4,balanced,0.2950826684633891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,4,balanced,0.3575466473897298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,4,balanced,0.3444053332010905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,4,balanced,0.4307626485824585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,4,balanced,0.5345280170440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,4,balanced,0.8115200201670328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,4,balanced,1.0321919918060303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,4,balanced,1.5214932759602864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,4,balanced,1.9903146425882976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,4,balanced,2.9538774490356445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,2,power_law_1.2,0.22568960189819337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,2,power_law_1.2,0.31600639820098875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,4,balanced,3.8674774169921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,2,power_law_1.2,0.5662720203399658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,2,power_law_1.2,0.6924287796020507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,2,power_law_1.2,0.8292351722717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,2,power_law_1.2,1.4847999572753907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,2,power_law_1.2,1.6111616134643554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,2,power_law_1.2,1.671366310119629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,2,power_law_1.2,1.621811294555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,2,power_law_1.2,1.6801792144775392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,2,power_law_1.2,1.7233919143676757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,2,power_law_1.2,1.7285120010375976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,2,power_law_1.2,1.7321983337402345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,2,power_law_1.2,1.7893375396728515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,2,power_law_1.2,1.8509824752807618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,2,power_law_1.2,1.8743295669555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,2,power_law_1.2,1.8829311370849608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,2,power_law_1.2,1.959097671508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,2,power_law_1.2,2.1145599365234373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,2,power_law_1.2,2.5235456466674804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,2,power_law_1.2,2.787942314147949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,2,power_law_1.2,3.4461696624755858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,2,power_law_1.2,3.6962303161621093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,128,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,128,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,128,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,128,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,128,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,128,balanced,0.2908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,128,balanced,0.42205333709716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,128,balanced,0.4251306851704915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,128,balanced,0.42444801330566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,128,balanced,0.4249279896418254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,128,balanced,0.4271786610285441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,128,balanced,0.43025068442026776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,128,balanced,0.43195732434590656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,128,balanced,0.4341760079065959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,128,balanced,0.4416853189468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,128,balanced,0.44185598691304523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,128,balanced,0.4500480095545451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,2,power_law_1.2,5.075353622436523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,128,balanced,0.46437867482503253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,128,balanced,0.4795733292897542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,128,balanced,0.502613345781962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,128,balanced,0.5440853436787924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,128,balanced,0.601744016011556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,128,balanced,0.7330133120218912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,128,balanced,0.7732906341552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,128,balanced,1.0262186527252197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,128,balanced,1.214624007542928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,128,balanced,1.55511474609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,8,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,8,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,8,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,8,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,8,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,8,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,8,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,8,power_law_1.01,0.02743679881095886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,8,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,8,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,8,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,8,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,8,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,8,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,8,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,8,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,8,power_law_1.01,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,8,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,8,power_law_1.01,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,8,power_law_1.01,0.09748479723930359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,8,power_law_1.01,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,8,power_law_1.01,0.2699264049530029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,8,power_law_1.01,0.3807231903076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,8,power_law_1.01,0.49457921981811526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,8,power_law_1.01,0.775167989730835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,8,power_law_1.01,1.0362879753112793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,2,power_law_1.2,6.259916687011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,4,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,4,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,4,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,4,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,4,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,4,power_law_1.01,0.03951359987258911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,4,power_law_1.01,0.04320639967918396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,4,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,4,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,4,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,4,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,4,power_law_1.01,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,4,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,4,power_law_1.01,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,4,power_law_1.01,0.13230079412460327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,4,power_law_1.01,0.12984319925308227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,4,power_law_1.01,0.1837056040763855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,4,power_law_1.01,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,4,power_law_1.01,0.34549760818481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,4,power_law_1.01,0.4988607883453369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,4,power_law_1.01,0.5996543884277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,4,power_law_1.01,0.9418496131896973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,4,power_law_1.01,1.1331583976745605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,4,power_law_1.01,1.935763168334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,4,power_law_1.01,2.447564888000488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,4,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,4,power_law_1.2,0.2066431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,4,power_law_1.2,0.3028991937637329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,4,power_law_1.2,0.3772416114807129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,4,power_law_1.2,0.46489601135253905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,4,power_law_1.2,0.6377471923828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,4,power_law_1.2,0.6184895992279053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,4,power_law_1.2,0.659660816192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,4,power_law_1.2,0.6721536159515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,4,power_law_1.2,0.6891520023345947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,4,power_law_1.2,0.7067647933959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,4,power_law_1.2,0.7020415782928466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,4,power_law_1.2,0.6920191764831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,4,power_law_1.2,0.7413695812225342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,4,power_law_1.2,0.7823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,4,power_law_1.2,0.7671807765960693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,4,power_law_1.2,0.8187904357910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,4,power_law_1.2,0.8796159744262695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,4,power_law_1.2,0.9234432220458985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,4,power_law_1.2,1.0604543685913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,4,power_law_1.2,1.1773951530456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,4,power_law_1.2,1.6312255859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,4,power_law_1.2,1.8450431823730469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,4,power_law_1.2,2.779955291748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,4,power_law_1.2,3.7588993072509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,2,power_law_1.2,8.643583679199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,8,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,8,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,8,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,8,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,8,balanced,0.24712532758712769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,8,balanced,0.2501973311106364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,8,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,8,balanced,0.2527573307355245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,8,balanced,0.25361067056655884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,8,balanced,0.25446399052937824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,8,balanced,0.25668267409006756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,8,balanced,0.2585600018501282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,8,balanced,0.2609493335088094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,8,balanced,0.26641066869099933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,8,balanced,0.2744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,8,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,8,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,8,balanced,0.30395734310150146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,4,power_law_1.01,3.5932159423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,8,balanced,0.30907734235127765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,8,balanced,0.3426933288574219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,8,balanced,0.3710293372472127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,8,balanced,0.4346880118052165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,8,balanced,0.5024426778157552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,8,balanced,0.6778879960378011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,8,balanced,0.8961653709411621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,8,balanced,1.4008320172627766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,8,balanced,1.9024213155110676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,4,power_law_1.2,4.755046463012695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,4,power_law_1.2,6.021529769897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,4,power_law_1.01,5.110579299926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,2,power_law_1.2,11.706163024902343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,1,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,1,power_law_1.2,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,1,power_law_1.2,0.14315520524978637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,1,power_law_1.2,0.2578432083129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,1,power_law_1.2,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,1,power_law_1.2,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,1,power_law_1.2,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,1,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,1,power_law_1.2,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,1,power_law_1.2,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,1,power_law_1.2,0.29528961181640623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,1,power_law_1.2,0.2996223926544189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,1,power_law_1.2,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,1,power_law_1.2,0.2973695993423462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,1,power_law_1.2,0.3063807964324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,1,power_law_1.2,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,1,power_law_1.2,0.33136639595031736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,1,power_law_1.2,0.3960832118988037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,1,power_law_1.2,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,1,power_law_1.2,0.606822395324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,1,power_law_1.2,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,1,power_law_1.2,0.9746303558349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,1,power_law_1.2,1.2781567573547363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,8,balanced,0.06502399841944377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,8,balanced,0.29286400477091473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,8,balanced,0.5466453234354655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,8,balanced,1.0547146797180176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,8,balanced,2.030933380126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,8,balanced,4.016640027364095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,8,balanced,4.020906766255696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,8,balanced,4.027050654093425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,8,balanced,4.030805269877116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,8,balanced,4.033530553181966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,8,balanced,4.038474718729655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,8,balanced,4.05128542582194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,8,balanced,4.0586239496866865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,8,balanced,4.067328135172526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,8,balanced,4.09446398417155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,8,balanced,4.113578796386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,8,balanced,4.157098770141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,8,balanced,4.307456016540527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,8,balanced,4.386133193969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,8,balanced,4.4631039301554365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,8,balanced,4.553386688232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,8,balanced,5.343402862548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,8,balanced,5.544277191162109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,8,balanced,6.278144200642903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,8,balanced,6.536698659261067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,1,power_law_1.2,1.9929088592529296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,8,balanced,7.88530158996582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,8,balanced,9.598634719848633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,2,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,2,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,2,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,2,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,2,balanced,0.2380639910697937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,2,balanced,0.24078933397928873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,2,balanced,0.24337067206700644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,2,balanced,0.24678399165471396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,2,balanced,0.24862933158874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,2,balanced,0.2505386670430501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,2,balanced,0.254805326461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,2,balanced,0.2582186659177144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,2,balanced,0.26368000109990436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,2,balanced,0.2730666597684224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,2,balanced,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,2,balanced,0.2916693290074666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,2,balanced,0.31214932600657147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,2,balanced,0.3375786542892456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,2,balanced,0.3834880193074544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,2,balanced,0.4524373213450114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,2,balanced,0.5734133323033651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,2,balanced,0.8854080041249593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,2,balanced,1.18886399269104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,2,balanced,1.7551360130310059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,2,balanced,2.3521226247151694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,2,balanced,3.5031038920084634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,2,balanced,4.610186576843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,1,balanced,0.5232640107472738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,1,balanced,0.9064106941223145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,1,balanced,1.7718507448832195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,1,balanced,1.7744213740030925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,1,balanced,1.773738702138265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,1,balanced,1.7826132774353027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,1,balanced,1.7896107037862141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,1,balanced,1.8107733726501465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,1,balanced,1.8588959376017253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,1,power_law_1.2,2.6550271987915037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,1,balanced,1.864192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,1,balanced,1.8829654057820637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,1,balanced,1.9007147153218586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,1,balanced,1.9102719624837239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,1,balanced,1.939626693725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,1,balanced,2.4538453420003257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,1,balanced,2.577066739400228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,1,balanced,2.6427733103434243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,1,balanced,3.081727981567383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,1,balanced,3.3087145487467446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,1,balanced,3.87447452545166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,1,balanced,4.498773256937663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,1,balanced,6.115669250488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,1,balanced,7.589199701944987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,1,balanced,10.443605422973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,1,balanced,13.2138671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,1,balanced,18.929322560628254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,1,balanced,24.77465565999349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,1,power_law_1.2,3.996031951904297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,1,power_law_1.2,5.355091094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,2,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,2,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,2,balanced,0.07543466488520305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,2,balanced,0.27665066719055176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,2,balanced,0.532480001449585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,2,balanced,1.028608004252116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,2,balanced,1.5261012713114421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,2,balanced,1.5330986976623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,2,balanced,1.5412747065226238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,2,balanced,1.5435093243916829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,2,balanced,1.5580159823099773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,2,balanced,1.5730346043904622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,2,balanced,1.591466744740804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,2,balanced,1.6167252858479817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,2,balanced,1.6443732579549153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,2,balanced,1.664170742034912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,2,balanced,1.7177599271138508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,2,balanced,1.819818655649821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,2,balanced,1.9665919939676921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,2,balanced,2.177194595336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,2,balanced,2.3854079246520996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,2,balanced,2.90286922454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,2,balanced,3.385343869527181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,2,balanced,4.431525230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,2,balanced,5.324106534322103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,2,balanced,7.361024220784505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,2,balanced,9.415338516235352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,32,power_law_1.2,0.6017024040222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,32,power_law_1.2,0.7913472175598144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,32,power_law_1.2,0.7888895988464355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,32,power_law_1.2,0.7880703926086425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,32,power_law_1.2,0.7899136066436767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,32,power_law_1.2,0.6301695823669433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,32,power_law_1.2,0.6707200050354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,32,power_law_1.2,0.7227392196655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,32,power_law_1.2,0.7001855850219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,32,power_law_1.2,0.683622407913208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,32,power_law_1.2,0.6805503845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,32,power_law_1.2,0.7555071830749511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,32,power_law_1.2,0.710041618347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,32,power_law_1.2,0.6838079929351807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,32,power_law_1.2,0.6832128047943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,32,power_law_1.2,0.7493631839752197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,32,power_law_1.2,0.7749631881713868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,32,power_law_1.2,0.8298496246337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,32,power_law_1.2,0.8409088134765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,32,power_law_1.2,1.00065279006958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,32,power_law_1.2,1.0907648086547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,32,power_law_1.2,1.4409728050231934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,32,power_law_1.2,1.7633024215698243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,32,power_law_1.2,2.4999744415283205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,32,power_law_1.2,3.408076858520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,32,power_law_1.2,4.852531051635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,8,balanced,0.046762665112813316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,8,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,8,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,8,balanced,0.2739199995994568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,8,balanced,0.4360533157984416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,8,balanced,0.5541546742121378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,8,balanced,0.5575679937998453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,8,balanced,0.5597866773605347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,8,balanced,0.5620053211847941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,8,balanced,0.5637120008468628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,8,balanced,0.5683199961980184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,32,power_law_1.2,6.7688446044921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,8,balanced,0.5732693274815878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,8,balanced,0.5771946509679159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,8,balanced,0.5860693454742432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,8,balanced,0.59716268380483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,8,balanced,0.6043306589126587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,8,balanced,0.6244693199793497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,8,balanced,0.6463146607081095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,8,balanced,0.6824959913889567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,8,balanced,0.7717546621958414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,8,balanced,0.8622079690297445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,8,balanced,1.074005365371704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,8,balanced,1.26310396194458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,8,balanced,1.7762986818949382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,8,balanced,2.3012693723042807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,8,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,8,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,8,balanced,3.243690808614095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,8,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,8,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,8,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,8,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,8,balanced,4.168362617492676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,8,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,8,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,8,power_law_1.2,0.04156160056591034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,8,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,8,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,8,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,8,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,8,power_law_1.2,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,8,power_law_1.2,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,8,power_law_1.2,0.13619199991226197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,8,power_law_1.2,0.18595839738845826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,8,power_law_1.2,0.2500607967376709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,8,power_law_1.2,0.34979839324951173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,2,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,2,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,2,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,2,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,2,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,2,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,2,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,2,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,2,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,2,power_law_1.2,0.03868159949779511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,2,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,2,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,2,power_law_1.2,0.044223999977111815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,2,power_law_1.2,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,2,power_law_1.2,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,2,power_law_1.2,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,2,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,2,power_law_1.2,0.10383360385894776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,2,power_law_1.2,0.13598719835281373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,8,power_law_1.2,0.5939072132110595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,2,power_law_1.2,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,2,power_law_1.2,0.3096575975418091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,2,power_law_1.2,0.4917247772216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,2,power_law_1.2,0.6205440044403077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,2,power_law_1.2,0.9969663619995117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,8,power_law_1.2,0.85032958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,2,power_law_1.2,1.4155776023864746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,2,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,2,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,2,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,2,power_law_1.01,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,2,power_law_1.01,0.13107199668884278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,2,power_law_1.01,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,2,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,2,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,2,power_law_1.01,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,2,power_law_1.01,0.3086335897445679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,2,power_law_1.01,0.32131199836730956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,2,power_law_1.01,0.3411967992782593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,2,power_law_1.01,0.3397631883621216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,2,power_law_1.01,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,2,power_law_1.01,0.3526655912399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,2,power_law_1.01,0.37765119075775144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,2,power_law_1.01,0.38993918895721436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,2,power_law_1.01,0.41840639114379885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,2,power_law_1.01,0.46387200355529784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,2,power_law_1.01,0.5259263992309571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,2,power_law_1.01,0.5990399837493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,2,power_law_1.01,0.7927743911743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,2,power_law_1.01,1.0332159996032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,2,power_law_1.01,1.386291217803955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,2,power_law_1.01,1.9101696014404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,2,power_law_1.01,2.633113670349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,2,power_law_1.01,3.3284095764160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,2,power_law_1.2,2.1962751388549804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,8,power_law_1.2,0.2392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,1,power_law_1.01,0.21831679344177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,1,power_law_1.01,0.40529918670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,1,power_law_1.01,0.744652795791626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,8,power_law_1.2,0.2932735919952393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,8,power_law_1.2,0.3536895990371704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,1,power_law_1.01,1.2734463691711426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,8,power_law_1.2,0.39731199741363527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,1,power_law_1.01,1.863475227355957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,8,power_law_1.2,0.5150720119476319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,8,power_law_1.2,0.4419583797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,8,power_law_1.2,0.4870143890380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,1,power_law_1.01,3.042099189758301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,8,power_law_1.2,0.4916863918304443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,8,power_law_1.2,0.4884479999542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,1,power_law_1.01,3.3042430877685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,8,power_law_1.2,0.497049617767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,8,power_law_1.2,0.5017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,8,power_law_1.2,0.5394432067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,8,power_law_1.2,0.5398272037506103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,1,power_law_1.01,3.4584575653076173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,8,power_law_1.2,0.5658304214477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,8,power_law_1.2,0.5847040176391601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,1,power_law_1.01,3.549184036254883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,8,power_law_1.2,0.6023168087005615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,8,power_law_1.2,0.6004735946655273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,1,power_law_1.01,3.5755905151367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,8,power_law_1.2,0.6850560188293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,8,power_law_1.2,0.7393280029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,1,power_law_1.01,3.706675338745117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,8,power_law_1.2,0.8517312049865723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,8,power_law_1.2,0.9955327987670899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,1,power_law_1.01,3.84901123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,8,power_law_1.2,1.3576191902160644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,1,power_law_1.01,3.9358463287353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,8,power_law_1.2,1.5409152030944824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,8,power_law_1.2,2.283091163635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,1,power_law_1.01,4.108902359008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,1,power_law_1.01,4.194713592529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,1,power_law_1.01,4.315545654296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,8,power_law_1.2,2.767647933959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,1,power_law_1.01,4.533657455444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,8,power_law_1.2,3.861094284057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,1,power_law_1.01,4.889599990844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,1,power_law_1.01,5.199052810668945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,8,power_law_1.2,5.738086318969726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,1,power_law_1.01,5.9721729278564455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,1,power_law_1.01,6.644493103027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,8,power_law_1.2,1.379532814025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,1,power_law_1.01,8.250777435302734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,1,power_law_1.01,9.59078369140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,1,power_law_1.01,12.893388366699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,1,power_law_1.01,15.817292785644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,2,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,2,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,2,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,2,balanced,0.13260799646377563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,2,balanced,0.35037867228190106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,2,balanced,0.6666239897410074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,2,balanced,0.6705493132273356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,2,balanced,0.6756693522135416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,2,balanced,0.6772053241729736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,2,balanced,0.6802720228830973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,2,balanced,0.6845440069834391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,2,balanced,0.6918826897939047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,2,balanced,0.6976799964904785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,2,balanced,0.7072426478068033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,1,power_law_1.01,22.22773132324219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,2,balanced,0.716970682144165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,2,balanced,0.7289173603057861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,2,balanced,0.7451252937316895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,2,balanced,0.8046933015187582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,2,balanced,0.8446293671925863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,2,balanced,0.9069226582845052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,2,balanced,1.001301368077596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,2,balanced,1.2112212975819905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,2,balanced,1.398954709370931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,2,balanced,1.864192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,2,balanced,2.3138880729675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,2,balanced,3.24454402923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,2,balanced,4.164437294006348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,1,power_law_1.01,28.0047607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,2,power_law_1.2,2.824985694885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,64,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,64,power_law_1.2,0.03764480054378509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,64,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,64,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,64,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,64,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,64,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,64,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,64,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,64,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,64,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,64,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,64,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,64,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,64,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,64,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,4,balanced,0.3092479904492696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,64,power_law_1.2,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,4,balanced,0.5408426523208618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,64,power_law_1.2,0.10649600028991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,4,balanced,1.0513066450754802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,64,power_law_1.2,0.13021440505981446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,4,balanced,2.071376005808512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,64,power_law_1.2,0.18759679794311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,64,power_law_1.2,0.2949120044708252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,4,balanced,4.108799934387207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,64,power_law_1.2,0.4433919906616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,64,power_law_1.2,0.6471680164337158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,4,balanced,8.191488265991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,64,power_law_1.2,0.890880012512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,64,power_law_1.2,1.367244815826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,4,balanced,8.192341486612955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,4,balanced,7.999317169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,4,balanced,8.00921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,4,balanced,8.00989850362142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,4,balanced,8.02781867980957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,4,balanced,8.040618896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,4,balanced,8.062463760375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,4,balanced,8.083114624023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,4,balanced,8.113663991292318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,4,balanced,8.152064005533854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,4,balanced,8.22391446431478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,4,balanced,8.553130467732748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,4,balanced,8.751445134480795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,4,balanced,8.955392201741537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,4,balanced,9.173333485921225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,4,balanced,10.596181233723959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,4,balanced,11.258708953857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,4,balanced,11.714900970458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,4,balanced,12.612266540527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,4,balanced,14.842367808024088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,4,balanced,17.73533884684245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,8,power_law_1.2,1.7065984725952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,1,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,1,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,1,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,1,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,1,balanced,0.03956799954175949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,1,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,1,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,1,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,1,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,1,balanced,0.0422986646493276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,1,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,1,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,1,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,1,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,1,balanced,0.08823466300964355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,1,balanced,0.09386666615804036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,1,balanced,0.1513813336690267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,1,balanced,0.20906666914621988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,1,balanced,0.24661332368850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,1,balanced,0.3131733338038127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,1,balanced,0.4001813332239787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,1,balanced,0.6515839894612631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,1,balanced,0.8436053593953451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,1,balanced,1.3228373527526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,1,balanced,1.8853546778361003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,1,balanced,2.903866767883301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,1,balanced,3.9280640284220376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,2,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,2,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,2,balanced,0.07389866809050243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,2,balanced,0.27613866329193115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,2,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,2,balanced,1.0333866278330486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,2,balanced,1.0364586512247722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,2,balanced,1.0410666465759277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,2,balanced,1.0507946809132893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,2,balanced,1.0531840324401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,2,balanced,1.0629119873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,2,balanced,1.0774186452229817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,2,balanced,1.0883413155873616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,2,balanced,1.1158186594645183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,2,balanced,1.1460266908009846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,2,balanced,1.1665066878000896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,2,balanced,1.2115626335144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,2,balanced,1.3323946793874104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,2,balanced,1.4378666877746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,2,balanced,1.6363520622253418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,2,balanced,1.876479943593343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,2,balanced,2.406912008921305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,2,balanced,2.858666737874349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,2,balanced,3.870037396748861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,2,balanced,4.84881051381429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,4,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,4,power_law_1.01,0.06818559765815735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,2,balanced,6.9072214762369795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,4,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,4,power_law_1.01,0.2764415979385376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,4,power_law_1.01,0.3782272100448608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,4,power_law_1.01,0.5144256114959717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,2,balanced,8.892245610555014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,4,power_law_1.01,0.48066558837890627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,4,power_law_1.01,0.6782847881317139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,4,power_law_1.01,0.6731520175933838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,256,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,4,power_law_1.01,0.6440576076507568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,256,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,4,power_law_1.01,0.6731776237487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,256,power_law_1.01,0.05200639963150024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,256,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,4,power_law_1.01,0.6776832103729248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,256,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,4,power_law_1.01,0.6950911998748779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,256,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,4,power_law_1.01,0.6780928134918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,256,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,256,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,4,power_law_1.01,0.7475200176239014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,256,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,256,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,256,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,256,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,256,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,256,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,256,power_law_1.01,0.06654080152511596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,4,power_law_1.01,0.7591936111450195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,256,power_law_1.01,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,4,power_law_1.01,0.8128512382507325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,256,power_law_1.01,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,256,power_law_1.01,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,4,power_law_1.01,0.8587264060974121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,256,power_law_1.01,0.14438400268554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,256,power_law_1.01,0.23490560054779053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,4,power_law_1.01,0.9168895721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,256,power_law_1.01,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,4,power_law_1.01,1.053286361694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,256,power_law_1.01,0.510361623764038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,4,power_law_1.01,1.2285951614379882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,256,power_law_1.01,0.6696959972381592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,256,power_law_1.01,1.02543363571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,4,power_law_1.01,1.6029695510864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,256,power_law_1.01,1.4237695693969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,4,power_law_1.01,1.8335744857788085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,32,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,32,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,256,power_law_1.01,2.071142387390137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,4,power_law_1.01,2.4938432693481447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,32,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,32,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,32,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,256,power_law_1.01,2.9497343063354493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,32,power_law_1.01,0.028863999247550964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,4,power_law_1.01,3.1315967559814455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,32,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,32,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,32,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,32,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,32,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,32,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,32,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,4,power_law_1.01,4.293011093139649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,32,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,32,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,32,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,32,power_law_1.01,0.06591359972953796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,32,power_law_1.01,0.08908799886703492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,32,power_law_1.01,0.1079103946685791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,32,power_law_1.01,0.16855039596557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,32,power_law_1.01,0.20152320861816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,4,power_law_1.01,5.988761520385742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,32,power_law_1.01,0.3311615943908691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,32,power_law_1.01,0.4265984058380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,32,power_law_1.01,0.7208640098571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,32,power_law_1.01,1.003110408782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,4,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,4,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,4,balanced,0.031727999448776245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,4,balanced,0.20087466637293497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,4,balanced,0.37512532869974774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,4,balanced,0.49321067333221436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,4,balanced,0.49425065517425537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,4,balanced,0.49186134338378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,4,balanced,0.49373865127563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,4,balanced,0.4957866668701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,4,balanced,0.5128533442815145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,4,balanced,0.49186134338378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,4,balanced,0.4940799872080485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,4,balanced,0.4978346824645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,4,balanced,0.5050026575724283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,4,balanced,0.5092693169911703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,4,balanced,0.520362655321757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,4,balanced,0.5341866811116537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,4,balanced,0.552618662516276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,4,balanced,0.5886293252309164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,4,balanced,0.6234453519185384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,4,balanced,0.7017813523610433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,4,balanced,0.7867733637491862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,4,balanced,0.9786026477813721
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,4,balanced,1.1677013238271077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,4,balanced,1.6049493153889973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,4,balanced,2.139647960662842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,2,power_law_1.2,0.18063360452651978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,2,power_law_1.2,0.28979198932647704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,2,power_law_1.2,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,2,power_law_1.2,0.46878719329833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,2,power_law_1.2,0.47124481201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,2,power_law_1.2,0.4765632152557373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,2,power_law_1.2,0.4794367790222168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,2,power_law_1.2,0.49315838813781737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,2,power_law_1.2,0.5093376159667968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,2,power_law_1.2,0.5253119945526123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,2,power_law_1.2,0.5314559936523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,2,power_law_1.2,0.5257215976715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,2,power_law_1.2,0.5449728012084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,2,power_law_1.2,0.5685247898101806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,2,power_law_1.2,0.6045695781707764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,2,power_law_1.2,0.6379519939422608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,2,power_law_1.2,0.6742015838623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,2,power_law_1.2,0.9459712028503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,2,power_law_1.2,0.8970047950744628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,2,power_law_1.2,1.1565055847167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,2,power_law_1.2,1.4921728134155274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,1,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,1,balanced,0.24250666300455728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,1,balanced,0.4602880080540975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,1,balanced,0.45943466822306317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,1,balanced,0.4638719956080119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,1,balanced,0.4657493432362874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,1,balanced,0.4681386550267537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,1,balanced,0.4666026830673218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,1,balanced,0.46898667017618817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,1,balanced,0.47138134638468426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,1,balanced,0.4843519926071167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,1,balanced,0.4911786715189616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,1,balanced,0.49664000670115155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,1,balanced,0.504149317741394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,1,balanced,0.5032960176467896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,1,balanced,0.5113173325856527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,1,balanced,0.5442560116449991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,1,balanced,0.6016000111897787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,1,balanced,0.6749866803487142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,1,balanced,0.8101546764373779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,1,balanced,0.9951573212941488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,1,balanced,1.482752005259196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,1,balanced,2.016256014506022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,1,balanced,3.1271254221598306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,1,balanced,4.183722813924153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,1,balanced,6.295551935831706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,1,balanced,8.4585812886556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,2,power_law_1.2,2.3201791763305666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,2,power_law_1.2,2.73571834564209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,2,power_law_1.2,3.666124725341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,2,power_law_1.2,5.144575881958008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,2,power_law_1.2,7.1284736633300785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,1,power_law_1.2,0.8355839729309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,1,power_law_1.2,1.4477312088012695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,1,power_law_1.2,2.8854015350341795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,1,power_law_1.2,4.505804824829101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,1,power_law_1.2,6.394060897827148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,1,power_law_1.2,11.958067321777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,1,power_law_1.2,12.786483001708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,1,power_law_1.2,13.467852783203124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,1,power_law_1.2,13.72692413330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,1,power_law_1.2,14.213510131835937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,1,power_law_1.2,14.886093139648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,1,power_law_1.2,15.377203369140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,1,power_law_1.2,15.671693420410156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,1,power_law_1.2,16.133529663085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,1,power_law_1.2,16.58531799316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,2,power_law_1.2,9.222541046142577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,1,power_law_1.2,17.172064208984374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,2,power_law_1.01,0.18554879426956178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,2,power_law_1.01,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,2,power_law_1.01,0.4792319774627686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,2,power_law_1.01,0.5308224201202393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,1,power_law_1.2,17.441792297363282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,2,power_law_1.01,0.5326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,2,power_law_1.01,0.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,2,power_law_1.01,0.5425151824951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,2,power_law_1.01,0.5443583965301514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,2,power_law_1.01,0.5597184181213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,2,power_law_1.01,0.5562367916107178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,2,power_law_1.01,0.5976064205169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,2,power_law_1.01,0.5693056106567382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,2,power_law_1.01,0.6219776153564454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,2,power_law_1.01,0.5947391986846924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,2,power_law_1.01,0.6627327919006347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,1,power_law_1.2,18.24376983642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,2,power_law_1.01,0.6680319786071778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,2,power_law_1.01,0.7106368064880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,2,power_law_1.01,0.8867456436157226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,8,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,8,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,8,power_law_1.01,0.030508801341056824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,8,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,8,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,8,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,8,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,2,power_law_1.01,1.081107234954834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,8,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,8,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,8,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,8,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,8,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,8,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,8,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,1,power_law_1.2,19.008102416992188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,8,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,8,power_law_1.01,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,8,power_law_1.01,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,8,power_law_1.01,0.1511423945426941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,8,power_law_1.01,0.17775360345840455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,8,power_law_1.01,0.22753279209136962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,8,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,8,power_law_1.01,0.38871040344238283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,2,power_law_1.01,1.4049280166625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,8,power_law_1.01,0.637337589263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,8,power_law_1.01,0.9353216171264649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,2,power_law_1.01,1.5386624336242676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,8,power_law_1.01,1.176371192932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,2,power_law_1.01,2.574515151977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,1,power_law_1.2,20.480409240722658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,2,power_law_1.01,3.47955207824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,64,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,64,power_law_1.01,0.03969280123710632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,1,power_law_1.2,21.070643615722656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,64,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,64,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,64,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,64,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,64,power_law_1.01,0.03929600119590759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,64,power_law_1.01,0.039705601334571836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,64,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,64,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,64,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,64,power_law_1.01,0.045849600434303285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,64,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,64,power_law_1.01,0.05077120065689087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,64,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,64,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,64,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,64,power_law_1.01,0.08089600205421447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,64,power_law_1.01,0.0989184021949768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,64,power_law_1.01,0.13352960348129272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,64,power_law_1.01,0.15441919565200807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,64,power_law_1.01,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,1,power_law_1.2,24.6540283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,64,power_law_1.01,0.2789376020431519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,64,power_law_1.01,0.42229762077331545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,64,power_law_1.01,0.5517312049865722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,64,power_law_1.01,0.8316736221313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,64,power_law_1.01,1.1667455673217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,1,power_law_1.2,25.68089599609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,2,power_law_1.01,4.011008071899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,16,power_law_1.01,1.1345919609069823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,16,power_law_1.01,1.4045184135437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,16,power_law_1.01,1.286143970489502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,1,power_law_1.2,31.76202392578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,16,power_law_1.01,1.323417568206787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,16,power_law_1.01,1.2486656188964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,16,power_law_1.01,1.3213695526123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,16,power_law_1.01,1.2419072151184083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,16,power_law_1.01,1.3541376113891601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,16,power_law_1.01,1.305177593231201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,16,power_law_1.01,1.416806411743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,16,power_law_1.01,1.2681216239929198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,16,power_law_1.01,1.3897727966308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,16,power_law_1.01,1.4262271881103517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,16,power_law_1.01,1.488691234588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,16,power_law_1.01,1.5032320022583008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,8,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,16,power_law_1.01,1.641881561279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,8,power_law_1.01,0.5509119987487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,16,power_law_1.01,1.6191488265991212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,8,power_law_1.01,0.7987008094787598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,1,power_law_1.2,38.070068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,8,power_law_1.01,0.7520256042480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,16,power_law_1.01,1.802649688720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,8,power_law_1.01,0.8443903923034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,16,power_law_1.01,1.8139135360717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,8,power_law_1.01,0.9488384246826171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,2,power_law_1.01,5.74279670715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,8,power_law_1.01,0.8867839813232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,8,power_law_1.01,0.9103360176086426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,8,power_law_1.01,0.9207551956176758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,8,power_law_1.01,0.893337631225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,16,power_law_1.01,2.1768192291259765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,8,power_law_1.01,0.9814016342163085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,8,power_law_1.01,0.9650176048278809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,16,power_law_1.01,2.5997312545776365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,8,power_law_1.01,0.9654272079467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,8,power_law_1.01,1.0086400032043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,16,power_law_1.01,3.4641918182373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,8,power_law_1.01,0.9701375961303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,8,power_law_1.01,1.0092543601989745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,8,power_law_1.01,1.0491904258728026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,16,power_law_1.01,3.890790557861328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,8,power_law_1.01,1.1182080268859864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,8,power_law_1.01,1.1882495880126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,8,power_law_1.01,1.3582271575927733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,16,power_law_1.01,5.170380783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,8,power_law_1.01,1.4698495864868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,8,power_law_1.01,1.8130943298339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,16,power_law_1.01,6.136627197265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,8,power_law_1.01,1.901158332824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,8,power_law_1.01,2.5687999725341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,1,power_law_1.2,50.07646789550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,16,power_law_1.01,7.385906982421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,8,power_law_1.01,3.1485952377319335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,8,power_law_1.01,4.427161788940429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,16,power_law_1.01,11.105689239501952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,8,power_law_1.01,5.628108978271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,2,power_law_1.01,8.790835571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,1,power_law_1.2,58.7653076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,2,power_law_1.01,11.345503997802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,2,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,2,balanced,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,2,balanced,0.4522666533788045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,2,balanced,0.8751786549886068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,2,balanced,1.7341440518697102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,2,balanced,1.7745919227600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,2,balanced,1.782101313273112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,2,balanced,1.7344853083292644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,2,balanced,1.740458647410075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,2,balanced,1.744383970896403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,2,balanced,1.7588906288146973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,2,balanced,1.77237335840861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,2,balanced,1.789946715037028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,2,balanced,1.8119680086771648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,2,balanced,1.8691412607828777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,2,balanced,1.8884266217549641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,2,balanced,1.926143964131673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,2,balanced,1.9181226094563801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,2,balanced,2.0375893910725913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,2,balanced,2.1797547340393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,2,balanced,2.2976853052775064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,2,balanced,2.59822940826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,2,balanced,2.8779519399007163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,2,balanced,3.6618239084879556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,2,balanced,4.64298661549886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,2,balanced,6.837589263916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,2,balanced,8.950101216634115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,1,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,1,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,1,balanced,0.07850666840871175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,1,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,1,balanced,0.53657599290212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,1,balanced,1.0335573355356853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,1,balanced,1.042944033940633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,1,balanced,1.050112009048462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,1,balanced,1.0620533625284831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,1,balanced,1.0710986455281575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,1,balanced,1.0902079741160076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,1,balanced,1.1074559688568115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,1,balanced,1.1241546471913655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,1,balanced,1.1610453128814697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,1,balanced,1.198421319325765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,1,balanced,1.2322133382161458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,1,balanced,1.3059413433074951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,1,balanced,1.4506667455037434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,1,balanced,1.6102399826049805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,1,balanced,1.97324800491333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,1,balanced,2.3021225929260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,1,balanced,2.9503040313720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,1,balanced,3.6159146626790366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,1,balanced,5.024256070454915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,1,balanced,6.536671956380208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,1,balanced,9.487695693969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,1,balanced,12.35968017578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,4,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,4,balanced,0.27374933163324994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,4,balanced,0.27426133553187054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,4,balanced,0.2757973273595174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,4,balanced,0.27801599105199176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,4,balanced,0.2797226707140605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,4,balanced,0.2807413339614868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,4,balanced,0.2834773262341817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,4,balanced,0.2851840058962504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,4,balanced,0.2863786617914836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,4,balanced,0.28484266996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,4,balanced,0.2863786617914836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,4,balanced,0.2923520008722941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,4,balanced,0.30805333455403644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,4,balanced,0.3174399932225545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,4,balanced,0.31726932525634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,4,balanced,0.3628373146057129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,4,balanced,0.41864534219106037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,4,balanced,0.5259946584701538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,4,balanced,0.6563839912414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,4,balanced,0.907093365987142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,4,balanced,1.1298133532206218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,4,balanced,1.6728746096293132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,4,balanced,2.1802666982014975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,4,balanced,3.0916268030802407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,4,balanced,4.041386604309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,1,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,1,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,1,power_law_1.01,0.12984319925308227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,1,power_law_1.01,0.26112000942230223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,1,power_law_1.01,0.35389440059661864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,1,power_law_1.01,0.5765120029449463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,1,power_law_1.01,0.6053887844085694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,1,power_law_1.01,0.6338560104370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,1,power_law_1.01,0.648806381225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,1,power_law_1.01,0.6680575847625733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,1,power_law_1.01,0.6944767951965332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,1,power_law_1.01,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,1,power_law_1.01,0.734003210067749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,1,power_law_1.01,0.7946239948272705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,1,power_law_1.01,0.8142848014831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,1,power_law_1.01,0.841318416595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,1,power_law_1.01,0.9039872169494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,1,power_law_1.01,1.0366975784301757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,1,power_law_1.01,1.2369919776916505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,1,power_law_1.01,1.5581184387207032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,1,power_law_1.01,1.7657855987548827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,1,power_law_1.01,2.3410688400268556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,1,power_law_1.01,2.9134847640991213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,1,power_law_1.01,4.0734718322753904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,1,power_law_1.01,5.322547149658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,1,power_law_1.01,7.874150085449219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,4,power_law_1.2,0.43970561027526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,1,power_law_1.01,10.420428466796874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,4,power_law_1.2,0.5992447853088378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,4,power_law_1.2,0.7354368209838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,64,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,64,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,4,power_law_1.2,0.961945629119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,64,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,64,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,64,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,64,power_law_1.01,0.030073601007461547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,64,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,64,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,64,power_law_1.01,0.04645119905471802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,64,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,64,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,4,power_law_1.2,1.2543999671936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,64,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,64,power_law_1.01,0.06099839806556702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,64,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,4,power_law_1.2,1.6480255126953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,64,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,64,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,64,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,64,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,4,power_law_1.2,1.6887807846069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,64,power_law_1.01,0.11919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,64,power_law_1.01,0.1769215941429138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,4,power_law_1.2,1.704140853881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,64,power_law_1.01,0.2838527917861938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,4,power_law_1.2,1.7272768020629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,64,power_law_1.01,0.49356799125671386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,32,power_law_1.01,0.030687999725341798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,64,power_law_1.01,0.6098944187164307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,32,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,4,power_law_1.2,1.8315263748168946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,32,power_law_1.01,0.028038400411605834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,32,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,64,power_law_1.01,1.075814437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,32,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,4,power_law_1.2,1.9556352615356445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,32,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,32,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,16,power_law_1.2,0.39669759273529054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,32,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,64,power_law_1.01,1.2830719947814941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,32,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,4,power_law_1.2,1.9300352096557618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,32,power_law_1.01,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,16,power_law_1.2,0.4966400146484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,32,power_law_1.01,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,32,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,16,power_law_1.2,0.5136384010314942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,32,power_law_1.01,0.040524798631668094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,4,power_law_1.2,2.025062370300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,32,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,32,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,16,power_law_1.2,0.5502975940704345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,32,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,4,power_law_1.2,2.0121599197387696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,32,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,16,power_law_1.2,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,32,power_law_1.01,0.05997440218925476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,32,power_law_1.01,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,4,power_law_1.2,2.106572723388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,16,power_law_1.2,0.5150720119476319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,32,power_law_1.01,0.09297919869422913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,32,power_law_1.01,0.14704639911651612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,16,power_law_1.2,0.46448640823364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,32,power_law_1.01,0.24432640075683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,4,power_law_1.2,2.0930431365966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,16,power_law_1.2,0.4704256057739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,32,power_law_1.01,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,16,power_law_1.2,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,32,power_law_1.01,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,16,power_law_1.2,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,4,power_law_1.2,2.1995391845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,16,power_law_1.2,0.51179518699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,32,power_law_1.01,0.9807871818542481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,16,power_law_1.2,0.5431295871734619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,4,power_law_1.2,2.3578624725341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,16,power_law_1.2,0.5253119945526123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,32,power_law_1.01,1.4518272399902343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,16,power_law_1.2,0.5607232093811035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,4,power_law_1.2,2.505523109436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,16,power_law_1.2,0.5689343929290771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,16,power_law_1.2,0.5898240089416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,4,power_law_1.2,2.7977727890014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,16,power_law_1.2,0.6207295894622803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,16,power_law_1.2,0.6533120155334473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,4,power_law_1.2,2.9904895782470704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,16,power_law_1.2,0.6957056045532226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,16,power_law_1.2,0.8415231704711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,16,power_law_1.2,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,4,power_law_1.2,3.749465560913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,16,power_law_1.2,1.2423168182373048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,4,power_law_1.2,4.137984085083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,16,power_law_1.2,1.4249983787536622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,4,power_law_1.2,5.703270339965821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,16,power_law_1.2,2.106777572631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,16,power_law_1.2,2.6669055938720705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,4,power_law_1.2,6.6914306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,16,power_law_1.2,4.297113418579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,4,power_law_1.2,9.025536346435548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,16,power_law_1.2,5.231820678710937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,4,power_law_1.2,12.031999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,4,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,4,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,4,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,4,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,4,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,4,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,4,balanced,0.22101332743962607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,4,balanced,0.23176532983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,4,balanced,0.23466666539510092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,4,balanced,0.2373973329861959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,4,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,4,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,4,balanced,0.25463465849558514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,4,balanced,0.2635093331336975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,4,balanced,0.2757973273595174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,4,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,4,balanced,0.3068586587905884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,4,balanced,0.34679468472798664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,4,balanced,0.3819520076115926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,4,balanced,0.45926400025685626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,4,balanced,0.5420373280843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,4,balanced,0.7729492982228597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,4,balanced,0.9902079900105795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,4,balanced,1.5131306648254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,4,balanced,2.128554662068685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,4,balanced,3.203925450642904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,4,balanced,4.31496524810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,128,power_law_1.2,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,128,power_law_1.2,0.29122560024261473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,128,power_law_1.2,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,128,power_law_1.2,0.22466559410095216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,128,power_law_1.2,0.2545664072036743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,128,power_law_1.2,0.26910719871520994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,128,power_law_1.2,0.29614078998565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,128,power_law_1.2,0.27175040245056153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,128,power_law_1.2,0.27197439670562745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,128,power_law_1.2,0.30023679733276365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,128,power_law_1.2,0.3026943922042847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,128,power_law_1.2,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,128,power_law_1.2,0.314572811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,128,power_law_1.2,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,128,power_law_1.2,0.31969280242919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,128,power_law_1.2,0.3278847932815552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,128,power_law_1.2,0.3379199981689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,128,power_law_1.2,0.4040703773498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,128,power_law_1.2,0.451584005355835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,128,power_law_1.2,0.5425024032592773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,128,power_law_1.2,0.6070271968841553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,128,power_law_1.2,0.8550399780273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,128,power_law_1.2,1.136025619506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,128,power_law_1.2,1.7377279281616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,128,power_law_1.2,2.4672256469726563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,128,power_law_1.2,3.7578750610351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,16,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,16,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,16,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,16,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,16,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,16,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,16,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,16,power_law_1.01,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,16,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,16,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,16,power_law_1.01,0.03909119963645935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,16,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,16,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,16,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,16,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,16,power_law_1.01,0.0831488013267517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,16,power_law_1.01,0.08392320275306701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,16,power_law_1.01,0.12206079959869384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,16,power_law_1.01,0.16381440162658692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,16,power_law_1.01,0.24145920276641847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,16,power_law_1.01,0.3375103950500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,16,power_law_1.01,0.41451520919799806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,16,power_law_1.01,0.6264832019805908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,16,power_law_1.01,0.9441023826599121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,8,power_law_1.01,0.04668160080909729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,8,power_law_1.01,0.0497408002614975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,16,power_law_1.01,1.2220416069030762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,8,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,8,power_law_1.01,0.046463999152183535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,8,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,8,power_law_1.01,0.048921599984169006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,8,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,8,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,8,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,8,power_law_1.01,0.05242239832878113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,8,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,8,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,8,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,8,power_law_1.01,0.06079360246658325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,8,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,8,power_law_1.01,0.06922240257263183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,8,power_law_1.01,0.077811199426651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,8,power_law_1.01,0.12757760286331177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,8,power_law_1.01,0.19435520172119142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,8,power_law_1.01,0.24657919406890869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,8,power_law_1.01,0.33136639595031736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,8,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,128,power_law_1.2,5.790310287475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,8,power_law_1.01,0.6750207901000976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,8,power_law_1.01,1.0000384330749512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,8,power_law_1.01,1.3623231887817382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,8,power_law_1.01,2.107596778869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,8,power_law_1.01,2.913279914855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,32,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,32,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,32,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,32,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,32,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,32,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,32,balanced,0.05902933577696482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,32,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,32,balanced,0.058864002426465355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,32,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,32,balanced,0.05919999877611796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,32,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,32,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,32,balanced,0.06297599772612254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,32,balanced,0.06741333504517873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,32,balanced,0.06980266670385997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,32,balanced,0.08703999718030293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,32,balanced,0.1390720009803772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,32,balanced,0.18500266472498575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,32,balanced,0.244053324063619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,32,balanced,0.2669173280398051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,32,balanced,0.3426986535390218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,32,balanced,0.3566933472951253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,32,balanced,0.5196586847305298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,32,balanced,0.6294186512629191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,32,balanced,1.0180266698201497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,32,balanced,1.3463892936706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,8,power_law_1.2,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,8,power_law_1.2,0.27238399982452394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,8,power_law_1.2,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,8,power_law_1.2,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,8,power_law_1.2,0.2756608009338379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,8,power_law_1.2,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,2,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,2,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,2,balanced,0.237226665019989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,8,power_law_1.2,0.32194559574127196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,2,balanced,0.452949325243632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,8,power_law_1.2,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,2,balanced,0.8832000096638998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,8,power_law_1.2,0.3680255889892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,2,balanced,0.8891733487447103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,8,power_law_1.2,0.4380671977996826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,2,balanced,0.8917333285013834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,2,balanced,0.8971947034200033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,8,power_law_1.2,0.5617663860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,2,balanced,0.9009493192036947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,8,power_law_1.2,0.6795263767242432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,2,balanced,0.9028213024139404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,2,balanced,0.9108479817708334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,2,balanced,0.9229653676350912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,8,power_law_1.2,0.7086080074310303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,2,balanced,0.9280800024668375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,2,balanced,0.9430932998657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,8,power_law_1.2,0.5998591899871826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,2,balanced,0.9738240242004395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,2,balanced,0.989525318145752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,8,power_law_1.2,0.7270400047302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,2,balanced,1.0170026620229085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,2,balanced,1.0763946374257405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,8,power_law_1.2,0.8249343872070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,2,balanced,1.1156480312347412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,2,balanced,1.2373332977294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,8,power_law_1.2,0.901734447479248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,2,balanced,1.3608959515889485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,2,balanced,1.6440320014953613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,2,balanced,1.9188052813212078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,8,power_law_1.2,1.17391357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,2,balanced,2.5630720456441245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,2,balanced,3.24181334177653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,2,balanced,4.704085350036621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,2,balanced,6.171648025512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,8,power_law_1.2,1.3996031761169434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,8,power_law_1.2,1.9329023361206055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,8,power_law_1.2,2.492825508117676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,8,power_law_1.2,3.4545665740966798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,8,power_law_1.2,4.146176147460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,1,power_law_1.01,0.33607680797576905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,1,power_law_1.01,0.5531648159027099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,1,power_law_1.01,1.0483712196350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,1,power_law_1.01,2.0170751571655274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,1,power_law_1.01,3.663257598876953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,1,power_law_1.01,5.063475036621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,1,power_law_1.01,6.0045310974121096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,1,power_law_1.01,7.97470703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,1,power_law_1.01,8.24606704711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,8,power_law_1.2,5.7368511199951175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,1,power_law_1.01,8.521100616455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,1,power_law_1.01,9.032281494140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,1,power_law_1.01,9.314508819580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,1,power_law_1.01,9.400934600830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,1,power_law_1.01,9.899212646484376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,1,power_law_1.01,9.957990264892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,1,power_law_1.01,10.144972991943359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,1,power_law_1.01,10.43988494873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,1,power_law_1.01,11.105075073242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,1,power_law_1.01,11.440742492675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,1,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,1,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,1,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,1,power_law_1.01,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,1,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,1,power_law_1.01,0.21422080993652343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,1,power_law_1.01,0.2320319890975952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,1,power_law_1.01,0.2381824016571045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,1,power_law_1.01,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,1,power_law_1.01,12.255232238769532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,1,power_law_1.01,0.25026559829711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,1,power_law_1.01,0.2637824058532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,1,power_law_1.01,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,1,power_law_1.01,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,1,power_law_1.01,0.3026943922042847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,1,power_law_1.01,0.3121151924133301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,1,power_law_1.01,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,1,power_law_1.01,0.34611198902130125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,1,power_law_1.01,0.39772160053253175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,1,power_law_1.01,0.4745215892791748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,1,power_law_1.01,0.6557695865631104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,1,power_law_1.01,12.96240692138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,1,power_law_1.01,0.8636416435241699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,1,power_law_1.01,1.306009578704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,1,power_law_1.01,1.7057792663574218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,1,power_law_1.01,2.4788991928100588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,1,power_law_1.01,3.274342346191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,1,power_law_1.01,14.231756591796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,1,power_law_1.01,4.960460662841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,8,power_law_1.2,6.9445442199707035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,1,power_law_1.01,6.677299499511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,1,power_law_1.01,14.731263732910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,8,power_law_1.2,9.026764678955079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,1,power_law_1.01,17.32874298095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,1,power_law_1.01,19.341722106933595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,1,power_law_1.01,25.636248779296874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,1,power_law_1.01,31.21397705078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,8,power_law_1.2,13.23888702392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,8,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,8,balanced,0.038218667109807335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,8,balanced,0.2384213407834371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,8,balanced,0.45585068066914874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,8,balanced,0.8768853346506754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,8,balanced,0.8797866503397623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,8,balanced,0.8813066482543945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,8,balanced,0.8838826815287272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,8,balanced,0.8861013253529867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,8,balanced,0.8888320128122965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,8,balanced,0.8936106363932291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,8,balanced,0.9011200269063314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,8,balanced,0.9094666639963785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,8,balanced,0.9161386489868164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,32,balanced,0.04453866680463155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,32,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,32,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,8,balanced,0.9374720255533854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,32,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,32,balanced,0.3264853358268738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,8,balanced,0.942250649134318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,32,balanced,0.37836798032124835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,32,balanced,0.3802453279495239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,8,balanced,0.9562453428904215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,32,balanced,0.38178133964538574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,32,balanced,0.38365864753723145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,8,balanced,0.9772106806437174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,32,balanced,0.385535995165507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,32,balanced,0.38707200686136883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,8,balanced,0.9823573430379232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,32,balanced,0.38860801855723065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,32,balanced,0.39202133814493817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,8,balanced,1.0463573137919109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,32,balanced,0.3966133197148641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,32,balanced,0.40345601240793866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,32,balanced,0.4082239866256714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,8,balanced,1.0664959748586018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,32,balanced,0.41779200236002606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,32,balanced,0.43775999546051025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,8,balanced,1.2014933427174885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,32,balanced,0.48418132464090985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,32,balanced,0.5413546562194824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,8,balanced,1.2912586530049641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,32,balanced,0.5415253241856893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,8,balanced,1.6510292689005535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,32,balanced,0.606549342473348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,32,balanced,0.6807893117268881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,8,balanced,2.0512426694234214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,32,balanced,0.8852480252583822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,32,balanced,1.1018239657084148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,8,balanced,3.0660266876220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,32,balanced,1.622528076171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,8,balanced,3.9949652353922525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,32,balanced,2.1725865999857583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,2,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,2,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,2,power_law_1.2,0.11366399526596069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,2,power_law_1.2,0.1955839991569519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,2,power_law_1.2,0.2263040065765381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,2,power_law_1.2,0.4237311840057373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,2,power_law_1.2,0.41840639114379885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,2,power_law_1.2,0.4403200149536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,2,power_law_1.2,0.4380608081817627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,2,power_law_1.2,0.4405248165130615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,2,power_law_1.2,0.47124481201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,2,power_law_1.2,0.4749311923980713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,2,power_law_1.2,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,2,power_law_1.2,0.49459199905395507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,2,power_law_1.2,0.5036032199859619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,2,power_law_1.2,0.5130239963531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,2,power_law_1.2,0.5505023956298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,2,power_law_1.2,0.6123519897460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,2,power_law_1.2,0.6627327919006347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,2,power_law_1.2,0.8032064437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,2,power_law_1.2,0.9197567939758301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,2,power_law_1.2,1.23187198638916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,2,power_law_1.2,1.477836799621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,2,power_law_1.2,2.0942848205566404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,2,power_law_1.01,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,2,power_law_1.01,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,2,power_law_1.01,0.416153621673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,2,power_law_1.01,0.5597184181213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,2,power_law_1.01,0.6950911998748779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,2,power_law_1.01,1.0983424186706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,2,power_law_1.01,1.1919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,2,power_law_1.01,1.1757568359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,2,power_law_1.01,1.2517312049865723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,2,power_law_1.01,1.2636159896850585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,2,power_law_1.01,1.2986368179321288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,2,power_law_1.01,1.3111295700073242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,2,power_law_1.01,1.3162495613098144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,2,power_law_1.01,1.4047231674194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,2,power_law_1.01,1.4522368431091308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,2,power_law_1.01,1.4454784393310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,2,power_law_1.01,1.4944255828857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,2,power_law_1.01,1.6242687225341796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,2,power_law_1.01,1.7088512420654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,2,power_law_1.2,2.729984092712402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,2,power_law_1.01,1.9376127243041992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,2,power_law_1.01,2.0992000579833983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,2,power_law_1.01,2.5730880737304687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,2,power_law_1.01,3.1219711303710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,2,power_law_1.01,4.048896026611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,2,power_law_1.01,4.888371276855469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,2,power_law_1.01,7.320575714111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,2,power_law_1.01,8.653209686279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,2,power_law_1.2,4.142079925537109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,16,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,16,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,16,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,16,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,16,power_law_1.01,0.036857599020004274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,16,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,16,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,16,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,16,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,16,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,16,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,16,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,16,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,16,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,16,power_law_1.01,0.0460671991109848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,16,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,16,power_law_1.01,0.05015680193901062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,16,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,16,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,16,power_law_1.01,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,16,power_law_1.01,0.09175040125846863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,16,power_law_1.01,0.13270399570465088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,16,power_law_1.01,0.22568318843841553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,16,power_law_1.01,0.34713599681854246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,16,power_law_1.01,0.46305279731750487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,16,power_law_1.01,0.749567985534668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,16,power_law_1.01,1.0272768020629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,2,power_law_1.2,4.924825668334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,2,power_law_1.01,1.1415552139282226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,2,power_law_1.01,2.081996726989746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,2,power_law_1.01,2.772377586364746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,2,power_law_1.01,4.289100646972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,2,power_law_1.01,5.643673706054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,2,power_law_1.01,8.427519989013671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,2,power_law_1.01,8.903884887695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,2,power_law_1.01,9.19552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,2,power_law_1.01,9.152921295166015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,2,power_law_1.01,9.741926574707032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,2,power_law_1.01,9.805824279785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,2,power_law_1.01,10.101554870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,2,power_law_1.01,10.122239685058593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,2,power_law_1.01,10.95761947631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,2,power_law_1.01,11.190668487548828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,64,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,64,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,64,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,64,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,64,balanced,0.049141332507133484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,64,balanced,0.05171200136343638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,64,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,64,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,64,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,64,balanced,0.056320001681645714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,64,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,64,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,64,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,64,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,64,balanced,0.06553600231806438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,64,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,64,balanced,0.08311466872692108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,64,balanced,0.09557333588600159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,64,balanced,0.15769599874814352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,64,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,64,balanced,0.28569600979487103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,2,power_law_1.01,11.52327651977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,64,balanced,0.36113067468007404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,64,balanced,0.4413439830144246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,64,balanced,0.6022826830546061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,64,balanced,0.8227840264638265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,64,balanced,1.193984031677246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,2,power_law_1.01,11.782144165039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,64,balanced,1.5788373947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,2,power_law_1.01,12.083609771728515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,2,power_law_1.01,12.274073791503906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,2,power_law_1.01,13.277798461914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,2,power_law_1.01,15.507046508789063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,32,1,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,32,1,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,32,1,balanced,0.06331733365853627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,32,1,balanced,0.09079466263453166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,32,1,balanced,0.29129600524902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,32,1,balanced,0.5422079960505167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,32,1,balanced,0.552618662516276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,32,1,balanced,0.5577386617660522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,32,1,balanced,0.5691519975662231
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,32,1,balanced,0.5746346712112427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,32,1,balanced,0.5918720165888468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,2,power_law_1.01,18.179481506347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,32,1,balanced,0.6063786745071411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,32,1,balanced,0.6191733280817667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,32,1,balanced,0.6517759958902994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,32,1,balanced,0.6842026710510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,32,1,balanced,0.7075786590576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,32,1,balanced,0.7879679997762045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,32,1,balanced,0.9238186677296957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,32,1,balanced,1.0876586437225342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,32,1,balanced,1.4260907173156738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,32,1,balanced,1.7752745946248372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,32,1,balanced,2.415445327758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,32,1,balanced,3.087530771891276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,2,power_law_1.01,18.286387634277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,32,1,balanced,4.4910933176676435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,32,1,balanced,5.981354395548503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,32,1,balanced,9.004202524820963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,2,power_law_1.01,23.507353210449217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,32,1,balanced,11.82907740275065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,2,power_law_1.01,26.86484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,2,power_law_1.01,36.87321472167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,2,power_law_1.01,44.56857604980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,4,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,4,power_law_1.01,0.029683199524879456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,4,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,4,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,4,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,4,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,4,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,4,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,4,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,4,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,4,power_law_1.01,0.04504320025444031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,4,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,4,power_law_1.01,0.0566976010799408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,4,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,4,power_law_1.01,0.09338240027427673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,4,power_law_1.01,0.08028159737586975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,4,power_law_1.01,0.09440000057220459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,4,power_law_1.01,0.12225919961929321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,4,power_law_1.01,0.15646719932556152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,4,power_law_1.01,0.22671360969543458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,4,power_law_1.01,0.30658559799194335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,1,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,1,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,1,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,1,power_law_1.01,0.15073280334472655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,1,power_law_1.01,0.22954239845275878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,1,power_law_1.01,0.37537920475006104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,1,power_law_1.01,0.4038656234741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,1,power_law_1.01,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,1,power_law_1.01,0.429260778427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,1,power_law_1.01,0.437011194229126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,1,power_law_1.01,0.4433919906616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,1,power_law_1.01,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,1,power_law_1.01,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,1,power_law_1.01,0.4712384223937988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,1,power_law_1.01,0.48472962379455564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,1,power_law_1.01,0.4943871974945068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,1,power_law_1.01,0.5115647792816163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,1,power_law_1.01,0.5543615818023682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.5941247940063477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,4,power_law_1.01,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.7137087821960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.8638208389282227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,1,power_law_1.01,1.145638370513916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,1,power_law_1.01,1.3508607864379882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,1,power_law_1.01,1.8900991439819337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,1,power_law_1.01,2.3640064239501952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,1,power_law_1.01,3.493888092041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,4,power_law_1.01,0.6123519897460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,1,power_law_1.01,4.6630912780761715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,4,power_law_1.01,0.8894463539123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,4,power_law_1.01,1.4534655570983888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,4,power_law_1.01,2.3856832504272463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,64,power_law_1.01,0.8427328109741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,64,power_law_1.01,0.799948787689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,64,power_law_1.01,0.8044544219970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,64,power_law_1.01,0.799948787689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,64,power_law_1.01,0.7278592109680175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,64,power_law_1.01,0.6545407772064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,64,power_law_1.01,0.7610367774963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,64,power_law_1.01,0.6805503845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,64,power_law_1.01,0.6840320110321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,64,power_law_1.01,0.6842368125915528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,64,power_law_1.01,0.78438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,64,power_law_1.01,0.7643136024475098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,64,power_law_1.01,0.7948287963867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,64,power_law_1.01,0.800972843170166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,64,power_law_1.01,0.8366080284118652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,64,power_law_1.01,0.7663616180419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,64,power_law_1.01,0.832307243347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,64,power_law_1.01,0.9392127990722656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,64,power_law_1.01,0.943718433380127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,64,power_law_1.01,1.035264015197754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,64,power_law_1.01,1.1812864303588868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,64,power_law_1.01,1.3047807693481446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,64,power_law_1.01,1.52227840423584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,64,power_law_1.01,2.369721603393555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,64,power_law_1.01,2.8409856796264648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,64,power_law_1.01,4.139622497558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,64,power_law_1.01,4.461951828002929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,4,power_law_1.01,3.637247848510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,4,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,4,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,4,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,4,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,4,balanced,0.0718506673971812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,4,balanced,0.2800640066464742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,4,balanced,0.28228267033894855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,4,balanced,0.28091732660929364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,4,balanced,0.28381866216659546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,4,balanced,0.28330665826797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,4,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,4,balanced,0.2887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,4,balanced,0.3107840021451314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,4,balanced,0.30582932631174725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,4,balanced,0.3094186584154765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,4,balanced,0.3256266713142395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,4,balanced,0.33928533395131427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,4,balanced,0.377344012260437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,4,balanced,0.41096532344818115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,4,balanced,0.47870934009552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,4,balanced,0.6323200066884359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,4,balanced,0.9352533022562662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,4,balanced,1.2366507053375244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,4,balanced,1.8486612637837727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,4,balanced,2.4284159342447915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,4,balanced,3.527850786844889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,4,balanced,4.6863358815511065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,8,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,8,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,8,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,8,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,8,balanced,0.06741333504517873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,8,balanced,0.20565332969029745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,8,balanced,0.20804266134897867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,8,balanced,0.20872533321380615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,8,balanced,0.21076800425847372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,8,balanced,0.21230934063593546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,8,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,8,balanced,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,8,balanced,0.22254933913548788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,8,balanced,0.2285226583480835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,8,balanced,0.23569067319234213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,8,balanced,0.24320000410079956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,8,balanced,0.2553173303604126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,8,balanced,0.27989333868026733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,8,balanced,0.30805333455403644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,8,balanced,0.35396265983581543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,8,balanced,0.3862186670303345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,8,balanced,0.4901546637217204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,8,balanced,0.5693440039952596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,8,balanced,0.8673280080159506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,8,balanced,1.2301653226216633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,8,balanced,1.8913280169169109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,8,balanced,2.493098735809326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,16,power_law_1.2,1.0530816078186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,16,power_law_1.2,2.068070411682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,16,power_law_1.2,2.952396774291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,16,power_law_1.2,2.975539207458496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,16,power_law_1.2,3.05664005279541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,16,power_law_1.2,3.078144073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,16,power_law_1.2,2.3992319107055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,16,power_law_1.2,2.592972755432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,4,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,16,power_law_1.2,2.368716812133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,4,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,4,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,4,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,4,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,16,power_law_1.2,2.5958208084106444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,4,power_law_1.2,0.14295040369033812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,4,power_law_1.2,0.13349759578704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,4,power_law_1.2,0.14479360580444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,16,power_law_1.2,2.5866111755371093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,4,power_law_1.2,0.1435647964477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,4,power_law_1.2,0.17838079929351808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,4,power_law_1.2,0.20992000102996827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,16,power_law_1.2,2.2796287536621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,4,power_law_1.2,0.21278719902038573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,4,power_law_1.2,0.19169280529022217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,16,power_law_1.2,2.5081855773925783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,4,power_law_1.2,0.23552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,4,power_law_1.2,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,4,power_law_1.2,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,4,power_law_1.2,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,16,power_law_1.2,2.6382335662841796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,4,power_law_1.2,0.319488000869751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,4,power_law_1.2,0.3596287965774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,4,power_law_1.2,0.41021437644958497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,16,power_law_1.2,2.7119424819946287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,4,power_law_1.2,0.531660795211792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,4,power_law_1.2,0.7813119888305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,16,power_law_1.2,2.979840087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,4,power_law_1.2,0.9598976135253906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,16,power_law_1.2,2.9825023651123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,4,power_law_1.2,1.6801792144775392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,16,power_law_1.2,3.1066047668457033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,16,power_law_1.2,3.322060775756836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,4,power_law_1.2,2.161868858337402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,16,power_law_1.2,3.604889678955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,16,power_law_1.2,3.788800048828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,16,power_law_1.2,4.747673416137696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,16,power_law_1.2,5.1910655975341795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,16,power_law_1.2,6.366803359985352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,16,power_law_1.2,8.15103988647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,4,power_law_1.2,3.356671905517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,16,power_law_1.2,13.495500183105468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,4,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,4,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,4,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,4,power_law_1.2,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,4,power_law_1.2,0.09871360063552856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,4,power_law_1.2,0.2125823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,4,power_law_1.2,0.21790719032287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,4,power_law_1.2,0.2381824016571045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,4,power_law_1.2,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,4,power_law_1.2,0.237772798538208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,4,power_law_1.2,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,4,power_law_1.2,0.2357248067855835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,4,power_law_1.2,0.25026559829711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,16,power_law_1.2,12.940083312988282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,4,power_law_1.2,0.25128960609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,4,power_law_1.2,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,4,power_law_1.2,0.260915207862854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,4,power_law_1.2,0.27729918956756594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,4,power_law_1.2,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,4,power_law_1.2,0.28958721160888673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,4,power_law_1.2,0.33402879238128663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,4,power_law_1.2,0.3983360052108765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,4,power_law_1.2,0.51179518699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,4,power_law_1.2,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,4,power_law_1.2,0.9021439552307129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,4,power_law_1.2,4.283596801757812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,4,power_law_1.2,1.2230655670166015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,4,power_law_1.2,1.6963584899902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,16,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,16,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,16,power_law_1.2,0.027846398949623107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,16,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,16,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,16,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,16,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,16,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,16,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,16,power_law_1.2,0.034790399670600894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,16,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,16,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,16,power_law_1.2,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,16,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,16,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,16,power_law_1.2,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,4,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,4,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,16,power_law_1.2,0.15564800500869752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,4,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,16,power_law_1.2,0.26746881008148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,4,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,16,power_law_1.2,0.3215359926223755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,4,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,4,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,4,power_law_1.01,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,4,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,4,power_law_1.01,0.043808001279830935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,4,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,4,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,4,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,4,power_law_1.01,0.05160319805145264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,4,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,4,power_law_1.01,0.05730559825897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,4,power_law_1.2,2.306867218017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,4,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,4,power_law_1.01,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,4,power_law_1.01,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,4,power_law_1.01,0.21237759590148925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,4,power_law_1.01,0.25968639850616454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,4,power_law_1.01,0.4229119777679443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,4,power_law_1.01,0.6293504238128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,4,power_law_1.01,1.110630416870117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,4,power_law_1.01,1.4063615798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,4,power_law_1.01,2.3013376235961913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,4,power_law_1.01,2.9497343063354493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,16,power_law_1.2,0.5750783920288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,16,power_law_1.2,0.7491583824157715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.8742912292480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,1,power_law_1.2,1.6300031661987304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,1,power_law_1.2,2.409676742553711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,1,power_law_1.2,3.246080017089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,32,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,32,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,1,power_law_1.2,5.544960021972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,32,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,32,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,32,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,32,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,32,power_law_1.2,0.04361599981784821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,32,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,32,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,1,power_law_1.2,6.201548767089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,32,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,32,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,32,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,32,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,32,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,32,power_law_1.2,0.05651199817657471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,1,power_law_1.2,6.415769958496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,32,power_law_1.2,0.05979520082473755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,32,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,32,power_law_1.2,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,32,power_law_1.2,0.10854400396347046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,32,power_law_1.2,0.16015360355377198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,32,power_law_1.2,0.24801280498504638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,1,power_law_1.2,6.341427230834961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,32,power_law_1.2,0.39874560832977296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,32,power_law_1.2,0.5062655925750732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,32,power_law_1.2,0.8255488395690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,1,power_law_1.2,6.604185485839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,1,power_law_1.2,6.654771423339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,1,power_law_1.2,6.840525054931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,32,power_law_1.2,1.146675205230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,16,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,16,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,16,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,16,balanced,0.30666132767995197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,1,power_law_1.2,6.801817321777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,16,balanced,0.5906773408253988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,16,balanced,0.7277226448059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,16,balanced,0.7287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,32,power_law_1.2,2.010111999511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,16,balanced,0.7313066323598226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,16,balanced,0.7321493625640869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,16,balanced,0.734549363454183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,16,balanced,0.7386453151702881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,16,balanced,0.7410346666971842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,16,balanced,0.7439359823862711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,16,balanced,0.7500800291697184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,16,balanced,0.7567359606424967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,16,balanced,0.7685120105743408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,16,balanced,0.7796053091684977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,16,balanced,0.8330240249633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,16,balanced,0.8260266780853271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,16,balanced,0.8820052941640218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,1,power_law_1.2,7.0529022216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,16,balanced,0.8717652956644694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,16,balanced,0.9502399762471517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,16,balanced,1.0400426387786865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,16,balanced,1.2992853323618572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,1,power_law_1.2,7.066419219970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,16,balanced,1.6017066637674968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,1,power_law_1.2,7.214080047607422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,16,balanced,2.268160025278727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,16,balanced,3.0271145502726235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,32,power_law_1.2,2.4471551895141603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,1,power_law_1.2,7.288217926025391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,1,power_law_1.2,7.622246551513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,16,power_law_1.2,1.3602815628051759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,1,power_law_1.2,8.022016143798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,1,power_law_1.2,8.856985473632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,1,power_law_1.2,10.085990142822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,1,power_law_1.2,12.340428924560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,1,power_law_1.2,12.548915100097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,16,power_law_1.2,1.8307071685791017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,1,power_law_1.2,16.477389526367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,1,power_law_1.2,19.722650146484376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,1,power_law_1.2,26.471014404296874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,2,power_law_1.01,0.2125823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,2,power_law_1.01,0.3573760032653809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,2,power_law_1.01,0.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,2,power_law_1.01,0.8435711860656738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,2,power_law_1.01,1.2132351875305176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,2,power_law_1.01,1.4295040130615235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,2,power_law_1.01,1.8774015426635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,2,power_law_1.01,2.011136054992676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,2,power_law_1.01,2.0635648727416993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,2,power_law_1.01,2.1925888061523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,2,power_law_1.01,2.220025634765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,2,power_law_1.01,2.2665216445922853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,2,power_law_1.01,2.232524871826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,64,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,2,power_law_1.01,2.286796760559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,64,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,64,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,2,power_law_1.01,2.388991928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,64,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,64,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,2,power_law_1.01,2.4936447143554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,64,power_law_1.01,0.037452799081802365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,64,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,64,power_law_1.01,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,2,power_law_1.01,2.5090047836303713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,64,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,64,power_law_1.01,0.04423039853572845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,64,power_law_1.01,0.04829440116882324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,2,power_law_1.01,2.5554943084716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,64,power_law_1.01,0.05077760219573975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,64,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,64,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,2,power_law_1.01,2.630451202392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,64,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,64,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,64,power_law_1.01,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,2,power_law_1.01,2.773811149597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,64,power_law_1.01,0.11550719738006592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,64,power_law_1.01,0.14991359710693358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,64,power_law_1.01,0.22405118942260743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,2,power_law_1.01,2.9521728515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,64,power_law_1.01,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,64,power_law_1.01,0.38195199966430665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,2,power_law_1.01,3.4414592742919923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,64,power_law_1.01,0.7004096031188964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,64,power_law_1.01,0.8501248359680176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,2,power_law_1.01,3.7380096435546877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,2,power_law_1.01,4.855193710327148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,2,power_law_1.01,5.236326217651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,2,power_law_1.01,7.140351867675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,2,power_law_1.01,8.68823013305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,1,power_law_1.2,32.45363159179688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,8,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,8,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,8,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,8,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,8,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,8,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,8,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,8,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,8,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,8,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,8,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,8,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,8,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,8,balanced,0.06195199986298879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,8,balanced,0.07799466451009114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,8,balanced,0.19114667177200317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,8,balanced,0.19847999016443887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,8,balanced,0.27187200387318927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,8,balanced,0.3054933349291484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,8,balanced,0.5135360161463419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,8,balanced,0.716970682144165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,8,balanced,1.1864746411641438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,8,balanced,1.544874668121338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,2,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,2,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,2,balanced,0.24200532833735147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,2,balanced,0.24302933613459268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,2,balanced,0.24371200799942017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,2,balanced,0.24541866779327393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,2,balanced,0.24712532758712769
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,2,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,2,balanced,0.2512213389078776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,2,balanced,0.25190399090449017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,2,balanced,0.2542933424313863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,2,balanced,0.2573653260866801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,2,balanced,0.25890133778254193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,2,balanced,0.27135999997456867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,2,balanced,0.2734079957008362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,2,balanced,0.28142933050791424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,2,balanced,0.28910932938257855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,2,balanced,0.3228800098101298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,2,balanced,0.3421866496404012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,2,balanced,0.44064001242319745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,2,balanced,0.5331626733144125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,2,balanced,0.7999146779378256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,2,balanced,1.109503984451294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,2,balanced,1.665877342224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,2,balanced,2.2244693438212075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,2,balanced,3.3430185317993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,2,balanced,4.41429328918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,16,4,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,16,4,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,16,4,power_law_1.2,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,16,4,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,16,4,power_law_1.2,0.10158079862594604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,16,4,power_law_1.2,0.11735039949417114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,16,4,power_law_1.2,0.22322559356689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,16,4,power_law_1.2,0.23019518852233886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,16,4,power_law_1.2,0.2654207944869995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,16,4,power_law_1.2,0.2500351905822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,16,4,power_law_1.2,0.25886719226837157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,16,4,power_law_1.2,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,16,4,power_law_1.2,0.2844543933868408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,16,4,power_law_1.2,0.29614078998565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,16,4,power_law_1.2,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,16,4,power_law_1.2,0.342630410194397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,16,4,power_law_1.2,0.37519359588623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,16,4,power_law_1.2,0.41799678802490237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,16,4,power_law_1.2,0.4501503944396973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,16,4,power_law_1.2,0.5355519771575927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,16,4,power_law_1.2,0.6569856166839599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,16,4,power_law_1.2,0.8975999832153321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,16,4,power_law_1.2,1.276313591003418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,16,4,power_law_1.2,1.8583551406860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,16,4,power_law_1.2,2.346393585205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,16,4,power_law_1.2,3.833241653442383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,16,4,power_law_1.2,4.880793762207031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,1,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,1,power_law_1.01,0.19517439603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,1,power_law_1.01,0.36659200191497804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,1,power_law_1.01,0.6062079906463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,1,power_law_1.01,0.8579071998596192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,1,power_law_1.01,1.42807035446167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,1,power_law_1.01,1.5271936416625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,1,power_law_1.01,1.5421440124511718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,1,power_law_1.01,1.6021503448486327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,1,power_law_1.01,1.641472053527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,1,power_law_1.01,1.7045503616333009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,1,power_law_1.01,1.7242111206054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,1,power_law_1.01,1.7975296020507812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,1,power_law_1.01,1.8362367630004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,1,power_law_1.01,1.8753536224365235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,1,power_law_1.01,1.92040958404541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,8,power_law_1.2,0.2678783893585205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,8,power_law_1.2,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,8,power_law_1.2,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,1,power_law_1.01,1.8989055633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,8,power_law_1.2,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,8,power_law_1.2,0.24145920276641847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,8,power_law_1.2,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,1,power_law_1.01,2.0142080307006838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,8,power_law_1.2,0.2486272096633911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,8,power_law_1.2,0.2514944076538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,8,power_law_1.2,0.25088000297546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,1,power_law_1.01,2.0975616455078123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,8,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,8,power_law_1.2,0.3126976013183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,8,power_law_1.2,0.33607680797576905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,1,power_law_1.01,2.288640022277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,8,power_law_1.2,0.35635199546813967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,8,power_law_1.2,0.3684351921081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,1,power_law_1.01,2.5024511337280275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,8,power_law_1.2,0.41308159828186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,1,power_law_1.01,3.018342399597168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,8,power_law_1.2,0.4972544193267822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,1,power_law_1.01,3.428761672973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,8,power_law_1.2,0.5834752082824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,1,power_law_1.01,4.351795196533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,8,power_law_1.2,0.8103679656982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,1,power_law_1.01,4.924620819091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,8,power_law_1.2,0.9316351890563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,1,power_law_1.01,6.778265380859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,1,power_law_1.01,8.22783966064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,8,power_law_1.2,1.4346112251281737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,8,power_law_1.2,1.8520063400268554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,8,power_law_1.2,2.711552047729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,8,power_law_1.2,3.3875968933105467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,1,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,1,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,1,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,1,balanced,0.23944532871246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,1,balanced,0.45584531625111896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,1,balanced,0.4626773198445638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,1,balanced,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,1,balanced,0.4739413261413574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,1,balanced,0.4802560011545817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,1,balanced,0.48503466447194415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,1,balanced,0.49817601839701336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,8,power_law_1.2,5.153177642822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,1,balanced,0.5111466646194458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,1,balanced,0.5193386475245158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,1,balanced,0.5396426518758138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,1,balanced,0.5597866773605347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,1,balanced,0.5806080102920532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,1,balanced,0.6184959808985392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,1,balanced,0.6971680323282877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,1,balanced,0.8002560138702393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,1,balanced,1.0424319903055828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,1,balanced,1.2854613463083904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,1,balanced,1.749333381652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,1,balanced,2.252629280090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,1,balanced,3.345050811767578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,1,balanced,4.457130750020345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,8,power_law_1.2,0.05015040040016174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,1,balanced,6.644053141276042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,8,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,8,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,8,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,8,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,1,balanced,8.741205215454102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,8,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,8,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,8,power_law_1.2,0.058963197469711306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,8,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,8,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,8,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,8,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,8,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,8,power_law_1.2,0.06798080205917359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,8,power_law_1.2,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,8,power_law_1.2,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,8,power_law_1.2,0.08704000115394592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,8,power_law_1.2,0.1679360032081604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,8,power_law_1.2,0.20660479068756105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,8,power_law_1.2,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,8,power_law_1.2,0.3876863956451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,8,power_law_1.2,0.5406720161437988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,8,power_law_1.2,0.7141248226165772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,8,power_law_1.2,1.1282431602478027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,8,power_law_1.2,1.6953344345092773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,8,power_law_1.2,2.6259456634521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,8,power_law_1.2,3.5971073150634765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,8,power_law_1.2,6.02869758605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,16,power_law_1.2,0.6254591941833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,16,power_law_1.2,0.7026688098907471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,16,power_law_1.2,0.6756351947784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,16,power_law_1.2,0.7020544052124024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,16,power_law_1.2,0.5951488018035889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,16,power_law_1.2,0.6688767910003662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,16,power_law_1.2,0.6053887844085694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,16,power_law_1.2,0.649625587463379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,16,power_law_1.2,0.6807551860809327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,16,power_law_1.2,0.7081984043121338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,16,power_law_1.2,0.7102464199066162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,16,power_law_1.2,0.7028736114501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,16,power_law_1.2,0.7206912040710449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,16,power_law_1.2,0.7383039951324463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,16,power_law_1.2,0.7620607852935791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,16,power_law_1.2,0.7692287921905517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,16,power_law_1.2,0.7935999870300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,16,power_law_1.2,0.8183808326721191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,16,power_law_1.2,0.9588671684265136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,16,power_law_1.2,1.1943936347961426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,16,power_law_1.2,1.3260736465454102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,16,power_law_1.2,1.8591743469238282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,16,power_law_1.2,2.4829952239990236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,16,power_law_1.2,3.2026622772216795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,16,power_law_1.2,3.841843032836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,16,power_law_1.2,6.130688095092774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,8,power_law_1.2,9.06588134765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,16,power_law_1.2,8.754994964599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,8,power_law_1.2,11.754496002197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,1,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,1,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,1,balanced,0.09181867043177287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,1,balanced,0.30719999472300213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,1,balanced,0.5838506619135538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,1,balanced,0.730282704035441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,1,balanced,0.736255963643392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,1,balanced,0.7538346449534098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,1,balanced,0.7647573153177897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,1,balanced,0.7734613418579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,1,balanced,0.7792479991912842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,1,balanced,0.8002560138702393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,1,balanced,0.8159573078155518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,1,balanced,0.8550399939219157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,1,balanced,0.8854186534881592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,1,balanced,0.9159466425577799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,1,balanced,0.9885013103485107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,1,balanced,1.1226186752319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,1,balanced,1.2950186729431152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,1,balanced,1.6443732579549153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,1,balanced,1.9831466674804688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,1,balanced,2.746709187825521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,1,balanced,3.5659093856811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,1,balanced,5.171365420023601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,1,balanced,6.860799789428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,1,balanced,10.094591776529947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,1,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,1,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,1,power_law_1.2,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,1,power_law_1.2,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,1,power_law_1.2,0.4034560203552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,1,balanced,13.252948760986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,1,power_law_1.2,0.6971392154693603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,1,power_law_1.2,0.7651328086853028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,1,power_law_1.2,0.8042495727539063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,1,power_law_1.2,0.8359935760498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,1,power_law_1.2,0.8935423851013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,1,power_law_1.2,0.881868839263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,1,power_law_1.2,0.9215999603271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,1,power_law_1.2,0.9345024108886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,1,power_law_1.2,0.9506815910339356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,1,power_law_1.2,0.973414421081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,1,power_law_1.2,0.992460823059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,1,power_law_1.2,1.0297344207763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,1,power_law_1.2,1.0885120391845704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,1,power_law_1.2,1.1462656021118165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,1,power_law_1.2,1.3103103637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,1,power_law_1.2,1.4577664375305175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,1,power_law_1.2,1.7696767807006837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,1,power_law_1.2,2.044723129272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,1,power_law_1.2,2.685951995849609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,1,power_law_1.2,3.1741952896118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,64,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,64,power_law_1.2,0.036620798707008365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,64,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,64,power_law_1.2,0.03500159978866577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,64,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,64,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,64,power_law_1.2,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,64,power_law_1.2,0.03705599904060364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,64,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,64,power_law_1.2,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,64,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,64,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,64,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,64,power_law_1.2,0.047679999470710756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,64,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,64,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,64,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,64,power_law_1.2,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,64,power_law_1.2,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,64,power_law_1.2,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,64,power_law_1.2,0.12899839878082275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,64,power_law_1.2,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,64,power_law_1.2,0.22200319766998292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,1,power_law_1.2,4.344012832641601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,64,power_law_1.2,0.36618239879608155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,64,power_law_1.2,0.46940159797668457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,64,power_law_1.2,0.8630271911621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,64,power_law_1.2,1.1612159729003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.2695168018341064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.3901439905166626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.5824512004852295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.8652799606323243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.881868839263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.9134079933166503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.9193471908569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.9332736015319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.9472000122070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.9324543952941895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.981811237335205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.9836544036865235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,1,power_law_1.01,1.024409580230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,1,power_law_1.01,1.0493824005126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,1,power_law_1.01,1.1247615814208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,1,power_law_1.01,1.1395071983337401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,1,power_law_1.01,1.2421119689941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,1,power_law_1.01,1.4532608032226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,1,power_law_1.01,1.5308799743652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,1,power_law_1.01,1.8954240798950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,1,power_law_1.01,2.2841344833374024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,1,power_law_1.2,5.4673408508300785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,1,power_law_1.01,3.15863037109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,1,power_law_1.01,3.936870574951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,1,power_law_1.01,5.615206527709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,1,power_law_1.01,7.129087829589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,8,balanced,0.26897066831588745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,8,balanced,0.2402986685434977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,8,balanced,0.2404693365097046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,8,balanced,0.24081067244211832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,8,balanced,0.24149332443873087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,8,balanced,0.24337067206700644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,8,balanced,0.24439465999603271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,8,balanced,0.2445653279622396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,8,balanced,0.2474666635195414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,8,balanced,0.24900267521540323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,8,balanced,0.253440002600352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,8,balanced,0.25309866666793823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,8,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,8,balanced,0.2667520046234131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,8,balanced,0.26793599128723145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,8,balanced,0.27357866366704303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,8,balanced,0.2792106668154399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,8,balanced,0.3725653489430745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,8,balanced,0.39611732959747314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,8,balanced,0.5302613178888956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,8,balanced,0.6212266683578491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,8,balanced,0.9115306536356608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,8,balanced,1.0905600388844807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,8,balanced,1.5684266090393066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,8,balanced,2.0317866007486978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,8,balanced,2.952021280924479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,8,balanced,3.807061195373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,1,power_law_1.01,10.36759033203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,2,power_law_1.2,0.6156288146972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,2,power_law_1.2,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,2,power_law_1.2,1.490944004058838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,2,power_law_1.2,2.4713024139404296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,2,power_law_1.2,3.5160064697265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,2,power_law_1.2,3.860889434814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,2,power_law_1.2,5.860332870483399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,2,power_law_1.2,6.266470336914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,2,power_law_1.2,6.5603584289550785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,2,power_law_1.2,6.6050048828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,2,power_law_1.2,6.594150543212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,2,power_law_1.2,6.74853744506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,2,power_law_1.2,7.171238708496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,2,power_law_1.2,7.318732452392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,2,power_law_1.2,7.5530242919921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,2,power_law_1.2,7.894630432128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,2,power_law_1.2,7.977779388427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,2,power_law_1.2,8.609996795654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,2,power_law_1.2,8.847564697265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,2,power_law_1.2,9.390898895263671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,2,power_law_1.2,10.37844467163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,2,power_law_1.2,11.618508911132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,128,power_law_1.01,0.05508480072021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,128,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,128,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,2,power_law_1.2,13.596672058105469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,128,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,128,power_law_1.01,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,128,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,128,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,128,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,128,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,128,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,128,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,128,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,128,power_law_1.01,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,128,power_law_1.01,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,128,power_law_1.01,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,2,power_law_1.2,16.70819854736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,128,power_law_1.01,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,128,power_law_1.01,0.11673599481582642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,128,power_law_1.01,0.14929920434951782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,128,power_law_1.01,0.2072511911392212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,128,power_law_1.01,0.27095038890838624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,128,power_law_1.01,0.30453760623931886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,128,power_law_1.01,0.38830080032348635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,128,power_law_1.01,0.5064703941345214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,128,power_law_1.01,0.7518208026885986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,2,power_law_1.2,17.379942321777342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,128,power_law_1.01,1.0493951797485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,128,power_law_1.01,1.4637056350708009
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,128,power_law_1.01,2.272256088256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,2,power_law_1.2,22.014361572265624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,2,power_law_1.2,26.651205444335936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,1,power_law_1.01,13.786726379394532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.45567998886108396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.556608009338379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,1,power_law_1.01,1.03689603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,1,power_law_1.01,1.008844757080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,1,power_law_1.01,1.0448896408081054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,1,power_law_1.01,1.0579968452453614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,1,power_law_1.01,1.086464023590088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,1,power_law_1.01,1.0790911674499513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,1,power_law_1.01,1.1079680442810058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,1,power_law_1.01,1.094655990600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,1,power_law_1.01,1.1327232360839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,1,power_law_1.01,1.147494411468506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,1,power_law_1.01,1.2302335739135741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,1,power_law_1.01,1.265664005279541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,1,power_law_1.01,1.328947162628174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,1,power_law_1.01,1.4133248329162598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,1,power_law_1.01,1.5587136268615722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,1,power_law_1.01,1.8149375915527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,1,power_law_1.01,2.239897537231445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,1,power_law_1.01,2.6091455459594726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,1,power_law_1.01,3.494911956787109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,4,2,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,4,2,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,4,2,balanced,0.28194133440653485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,4,2,balanced,0.2841599980990092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,4,2,balanced,0.2773333390553792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,128,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,128,balanced,0.04981866478919983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,128,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,128,balanced,0.05170666674772898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,128,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,128,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,128,balanced,0.05444266895453135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,128,balanced,0.05494933327039083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,128,balanced,0.05509333312511444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,128,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,128,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,128,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,128,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,128,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,128,balanced,0.06519466638565063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,128,balanced,0.07884799937407176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,128,balanced,0.09471999605496724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,4,2,balanced,0.2790186603864034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,128,balanced,0.1518933375676473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,4,2,balanced,0.2805440028508504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,128,balanced,0.23995733261108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,4,2,balanced,0.28194133440653485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,4,2,balanced,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,128,balanced,0.28433066606521606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,4,2,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,4,2,balanced,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,128,balanced,0.3575466473897298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,128,balanced,0.43059198061625165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,128,balanced,0.5963040192921957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,128,balanced,0.7973546981811523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,4,2,balanced,0.2983253399531047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,4,2,balanced,0.30088533957799274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,128,balanced,1.1448319753011067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,4,2,balanced,0.29661866029103595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,4,2,balanced,0.30086400111516315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,4,2,balanced,0.30532266696294147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,4,2,balanced,0.3263466755549113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,4,2,balanced,0.35140268007914227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,4,2,balanced,0.38841064771016437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,128,balanced,1.5223466555277507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,4,2,balanced,0.4638719956080119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,4,2,balanced,0.5809493462244669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,4,2,balanced,0.871397336324056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,4,2,balanced,1.1415893236796062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,4,2,balanced,1.7181013425191243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,4,2,balanced,2.3895039558410645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,4,2,balanced,3.668309211730957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,1,power_law_1.01,4.392531204223633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,4,2,balanced,4.913322766621907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,16,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,16,balanced,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,16,balanced,0.021674667795499165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,16,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,16,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,16,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,16,balanced,0.02388266722361247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,16,balanced,0.02405333270629247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,16,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,16,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,16,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,16,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,16,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,16,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,16,balanced,0.027813332776228588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,16,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,16,balanced,0.03326933334271113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,16,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,16,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,16,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,16,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,16,balanced,0.1302186648050944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,16,balanced,0.22118399540583292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,16,balanced,0.3386026620864868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,16,balanced,0.4633599917093913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,1,power_law_1.01,6.095257568359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,1,power_law_1.01,7.7012992858886715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,32,power_law_1.01,0.3158015966415405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,32,power_law_1.01,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,32,power_law_1.01,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,32,power_law_1.01,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,32,power_law_1.01,0.22425599098205568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,32,power_law_1.01,0.16486400365829468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,32,power_law_1.01,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,32,power_law_1.01,0.2623487949371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,32,power_law_1.01,0.27729918956756594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,32,power_law_1.01,0.2514944076538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,32,power_law_1.01,0.26746881008148193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,32,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,32,power_law_1.01,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,32,power_law_1.01,0.27013120651245115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,32,power_law_1.01,0.3018752098083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,32,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,32,power_law_1.01,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,32,power_law_1.01,0.33853440284729003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,32,power_law_1.01,0.34549760818481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,32,power_law_1.01,0.3936255931854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,32,power_law_1.01,0.430079984664917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,32,power_law_1.01,0.5748735904693604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,32,power_law_1.01,0.7522175788879395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,32,power_law_1.01,1.1302911758422851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,32,power_law_1.01,1.3103103637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,32,power_law_1.01,1.906483268737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,32,power_law_1.01,2.779136085510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,1,power_law_1.01,11.36209945678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,1,power_law_1.01,14.688665771484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,64,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,64,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,64,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,64,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,64,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,64,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,64,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,64,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,64,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,64,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,64,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,64,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,64,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,64,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,64,power_law_1.2,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,64,power_law_1.2,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,64,power_law_1.2,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,64,power_law_1.2,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,64,power_law_1.2,0.107315194606781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,64,power_law_1.2,0.15278079509735107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,64,power_law_1.2,0.19394559860229493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,8,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,64,power_law_1.2,0.2637824058532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,8,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,64,power_law_1.2,0.3448832035064697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,8,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,8,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,64,power_law_1.2,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,8,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,8,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,8,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,64,power_law_1.2,0.7047167778015136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,8,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,8,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,64,power_law_1.2,1.1667455673217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,8,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,8,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,8,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,64,power_law_1.2,1.8685951232910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,8,power_law_1.01,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,8,power_law_1.01,0.11448320150375366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,8,power_law_1.01,0.13127679824829103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,8,power_law_1.01,0.1884160041809082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,8,power_law_1.01,0.31436800956726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,8,power_law_1.01,0.42741761207580564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,8,power_law_1.01,0.6397952079772949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,8,power_law_1.01,1.0584063529968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,8,power_law_1.01,1.3737983703613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,8,power_law_1.01,2.30010871887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,4,power_law_1.01,1.1300864219665527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,4,power_law_1.01,1.9300352096557618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,4,power_law_1.01,2.428108787536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,4,power_law_1.01,3.2399360656738283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,4,power_law_1.01,3.240550231933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,4,power_law_1.01,4.724326324462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,128,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,128,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,128,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,4,power_law_1.01,4.683980941772461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,128,power_law_1.01,0.029075199365615846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,128,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,128,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,128,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,128,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,128,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,128,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,4,power_law_1.01,4.950835037231445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,128,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,128,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,128,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,128,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,128,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,128,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,4,power_law_1.01,4.757708740234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,128,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,128,power_law_1.01,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,128,power_law_1.01,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,128,power_law_1.01,0.1462272047996521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,128,power_law_1.01,0.18001919984817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,4,power_law_1.01,4.8529407501220705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,128,power_law_1.01,0.27729918956756594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,128,power_law_1.01,0.36761600971221925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,128,power_law_1.01,0.68853759765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,4,power_law_1.01,5.016556930541992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,128,power_law_1.01,0.8693759918212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,128,power_law_1.01,1.5112192153930664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,4,power_law_1.01,5.150291061401367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,128,power_law_1.01,2.048409652709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,4,power_law_1.01,5.207244873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,4,power_law_1.01,5.322137451171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,4,power_law_1.01,5.413068771362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,4,power_law_1.01,5.618073654174805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,4,power_law_1.01,5.566668701171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,4,power_law_1.01,6.140723037719726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,4,power_law_1.01,6.36517105102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,4,power_law_1.01,6.727884674072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,4,power_law_1.01,7.653785705566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,4,power_law_1.01,8.781209564208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,4,power_law_1.01,9.998131561279298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,4,power_law_1.01,12.908326721191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,8,power_law_1.01,3.0941183090209963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,4,power_law_1.01,15.694630432128907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,4,power_law_1.01,21.97973175048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,4,power_law_1.01,26.664312744140624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,1,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,1,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,1,power_law_1.01,0.16998399496078492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,1,power_law_1.01,0.3543040037155151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,1,power_law_1.01,0.5064703941345214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,1,power_law_1.01,0.6897664070129395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,1,power_law_1.01,0.9424896240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,1,power_law_1.01,1.0190848350524901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,1,power_law_1.01,1.056768035888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,1,power_law_1.01,1.0924032211303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,1,power_law_1.01,1.1126784324645995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,1,power_law_1.01,1.175551986694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,1,power_law_1.01,1.175334358215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,1,power_law_1.01,1.2210176467895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,1,power_law_1.01,1.2699647903442384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,1,power_law_1.01,1.2926976203918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,1,power_law_1.01,1.3510592460632325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,1,power_law_1.01,1.4452735900878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,1,power_law_1.01,1.5560704231262208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,1,power_law_1.01,1.7291263580322265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,1,power_law_1.01,1.8749439239501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,1,power_law_1.01,2.2419456481933593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,1,power_law_1.01,2.6888191223144533
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,1,power_law_1.01,3.447603225708008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,1,power_law_1.01,3.947520065307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,1,power_law_1.01,5.462220764160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,1,power_law_1.01,7.041843414306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,2,power_law_1.01,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,2,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,2,power_law_1.01,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,2,power_law_1.01,0.11100159883499146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,2,power_law_1.01,0.20398080348968506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,2,power_law_1.01,0.31989760398864747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,2,power_law_1.01,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,2,power_law_1.01,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,2,power_law_1.01,0.3483648061752319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,2,power_law_1.01,0.35246078968048095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,2,power_law_1.01,0.36863999366760253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,2,power_law_1.01,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,2,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,2,power_law_1.01,0.4114431858062744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,2,power_law_1.01,0.4286464214324951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,2,power_law_1.01,0.44462080001831056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,2,power_law_1.01,0.47020158767700193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,2,power_law_1.01,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,2,power_law_1.01,0.6043647766113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,2,power_law_1.01,0.7471104145050049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,2,power_law_1.01,0.9119744300842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,2,power_law_1.01,1.3434880256652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,2,power_law_1.01,1.740595245361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,2,power_law_1.01,2.4180736541748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,2,power_law_1.01,3.1502336502075194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,2,power_law_1.01,4.535295867919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,2,power_law_1.01,6.161612701416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,1,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,1,power_law_1.2,0.19742720127105712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,1,power_law_1.2,0.3526655912399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,1,power_law_1.2,0.617471981048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,1,power_law_1.2,0.8707967758178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,1,power_law_1.2,1.246617603302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,1,power_law_1.2,1.8782207489013671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,1,power_law_1.2,1.94703369140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,1,power_law_1.2,2.0283391952514647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,1,power_law_1.2,2.048409652709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,1,power_law_1.2,2.1575679779052734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,1,power_law_1.2,2.3132160186767576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,1,power_law_1.2,2.294963264465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,1,power_law_1.2,2.3379968643188476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,1,power_law_1.2,2.427903938293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,1,power_law_1.2,0.32931840419769287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,1,power_law_1.2,2.4522432327270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,1,power_law_1.2,0.5482495784759521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,1,power_law_1.2,1.031987190246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,1,power_law_1.2,2.6415103912353515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,1,power_law_1.2,1.8698240280151368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,1,power_law_1.2,2.7326208114624024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,1,power_law_1.2,2.7400192260742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,1,power_law_1.2,2.837708854675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,1,power_law_1.2,3.6210689544677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,1,power_law_1.2,3.0496768951416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,1,power_law_1.2,3.3017856597900392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,1,power_law_1.2,5.761433410644531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,1,power_law_1.2,3.748659133911133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,1,power_law_1.2,5.976063919067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,1,power_law_1.2,4.216831970214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,1,power_law_1.2,6.147891235351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,1,power_law_1.2,5.244927978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,1,power_law_1.2,6.355148696899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,1,power_law_1.2,6.314598464965821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,1,power_law_1.2,6.663577270507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,1,power_law_1.2,8.430387115478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,1,power_law_1.2,6.859980773925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,1,power_law_1.2,6.981222534179688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,1,power_law_1.2,10.228530883789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,1,power_law_1.2,7.328768157958985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,1,power_law_1.2,7.399219512939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,1,power_law_1.2,7.5931648254394535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,1,power_law_1.2,7.9028160095214846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,1,power_law_1.2,8.45148162841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,1,power_law_1.2,8.721817779541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,1,power_law_1.2,9.227436828613282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,1,power_law_1.2,10.226892852783203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,1,power_law_1.2,11.475762939453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,1,power_law_1.2,12.351897430419921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,1,power_law_1.2,15.096832275390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,1,power_law_1.2,17.940480041503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,1,power_law_1.2,24.10045471191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,1,power_law_1.2,28.595608520507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,8,8,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,8,8,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,8,8,power_law_1.2,0.04300160109996796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,8,8,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,8,8,power_law_1.2,0.042387199401855466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,8,8,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,8,8,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,8,8,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,8,8,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,8,8,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,8,8,power_law_1.2,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,8,8,power_law_1.2,0.13701119422912597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,8,8,power_law_1.2,0.1282047986984253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,8,8,power_law_1.2,0.14213119745254515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,8,8,power_law_1.2,0.1959936022758484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,8,8,power_law_1.2,0.2136064052581787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,8,8,power_law_1.2,0.21872639656066895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,8,8,power_law_1.2,0.32665600776672366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,8,8,power_law_1.2,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,8,8,power_law_1.2,0.7305215835571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,8,8,power_law_1.2,0.8796159744262695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,8,8,power_law_1.2,1.2974080085754394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,8,8,power_law_1.2,1.6445440292358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,8,8,power_law_1.2,2.668339157104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,8,8,power_law_1.2,3.438796615600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,4,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,4,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,4,power_law_1.2,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,4,power_law_1.2,0.321126389503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,4,power_law_1.2,0.3905535936355591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,4,power_law_1.2,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,4,power_law_1.2,0.4646912097930908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,4,power_law_1.2,0.6129663944244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,4,power_law_1.2,0.6354944229125976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,4,power_law_1.2,0.6160384178161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,4,power_law_1.2,0.6793216228485107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,4,power_law_1.2,0.6932479858398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,4,power_law_1.2,0.6731776237487793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,4,power_law_1.2,0.6903808116912842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,4,power_law_1.2,0.7251967906951904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,4,power_law_1.2,0.7395328044891357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,4,power_law_1.2,0.8466431617736816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,4,power_law_1.2,0.8679424285888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,4,power_law_1.2,0.9349120140075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,4,power_law_1.2,1.0907648086547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,4,power_law_1.2,1.2003328323364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,4,power_law_1.2,1.5689727783203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,4,power_law_1.2,1.862860870361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,4,power_law_1.2,2.4119295120239257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,4,power_law_1.2,2.9984767913818358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,4,power_law_1.2,4.275814437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,4,power_law_1.2,5.799935913085937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,1,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,1,balanced,0.155648003021876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,1,balanced,0.34884266058603924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,1,balanced,0.6679893334706625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,1,balanced,1.307802677154541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,1,balanced,2.573823928833008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,1,balanced,2.582869370778402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,1,balanced,2.590208053588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,1,balanced,2.601616064707438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,1,balanced,2.606933275858561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,1,balanced,2.6219520568847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,1,balanced,2.6385067303975425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,1,balanced,2.6489173571268716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,1,balanced,2.6762240727742515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,1,power_law_1.01,0.36229119300842283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,1,power_law_1.01,0.6772607803344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,1,balanced,2.702335993448893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,1,power_law_1.01,1.299251174926758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,1,balanced,2.727423985799154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,1,balanced,2.7755521138509116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,1,power_law_1.01,2.5608192443847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,1,balanced,2.9731839497884116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,1,balanced,3.073866526285807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,1,power_law_1.01,3.881369781494141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,1,balanced,3.2588745752970376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,1,balanced,3.4170878728230796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,1,power_law_1.01,5.171609497070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,1,balanced,3.7019306818644204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,1,balanced,4.095472017923991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,1,power_law_1.01,7.380377960205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,1,balanced,5.02732785542806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,1,power_law_1.01,7.5978752136230465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,1,balanced,5.925546646118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,1,balanced,7.7506561279296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,1,power_law_1.01,7.885414123535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,8,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,8,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,8,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,8,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,8,power_law_1.01,0.028460800647735596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,8,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,8,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,1,balanced,9.77885882059733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,1,power_law_1.01,8.281497955322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,8,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,8,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,8,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,8,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,8,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,8,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,8,power_law_1.01,0.061612802743911746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,1,power_law_1.01,8.318975830078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,8,power_law_1.01,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,8,power_law_1.01,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,1,power_law_1.01,8.648499298095704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,8,power_law_1.01,0.11673599481582642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,1,power_law_1.01,8.861491394042968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,8,power_law_1.01,0.1525760054588318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,8,power_law_1.01,0.2027519941329956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,1,power_law_1.01,9.096601867675782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,1,power_law_1.01,9.21886749267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,8,8,power_law_1.2,5.369036865234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,1,power_law_1.01,9.219891357421876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,1,power_law_1.01,9.657958221435546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,8,power_law_1.01,0.27340800762176515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,1,power_law_1.01,10.19494400024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,1,power_law_1.01,10.117938995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,8,power_law_1.01,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,1,power_law_1.01,10.312902069091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,8,power_law_1.01,0.5582848072052002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,8,power_law_1.01,0.881049633026123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,1,power_law_1.01,11.108147430419923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,1,power_law_1.01,12.708659362792968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,1,power_law_1.01,13.9040771484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,1,power_law_1.01,17.207705688476562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,1,power_law_1.01,18.068275451660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,8,power_law_1.01,1.208524799346924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.033580800890922545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,1,power_law_1.01,23.573497009277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.13107199668884278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.045433598756790164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.3794944047927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.5830656051635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.05301759839057922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.617471981048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.6762495994567871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.6823935985565186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.6993919849395752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.7393280029296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.7602176189422607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.7720960140228271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.07802240252494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.8194047927856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.8437760353088379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.0989184021949768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.8833024024963378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.10751359462738037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.9682944297790528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,1,power_law_1.01,1.1390975952148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,1,power_law_1.01,1.310092830657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.11223039627075196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,1,power_law_1.01,1.6658432006835937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,1,power_law_1.01,28.67669677734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,1,power_law_1.01,1.9927040100097657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.19148800373077393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,1,power_law_1.01,2.7226112365722654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,1,power_law_1.01,3.522150421142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,1,power_law_1.01,5.080678558349609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,1,power_law_1.01,6.728498840332032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,1,power_law_1.01,9.967616271972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.3659456014633179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,1,power_law_1.01,13.1483642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,8,power_law_1.01,1.9998720169067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.7931903839111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,8,power_law_1.01,2.91409912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,8,8,power_law_1.2,6.90645751953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,2,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,2,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,2,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,2,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,2,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,2,balanced,0.1904639999071757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,2,balanced,0.19182932376861572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,2,balanced,0.1991680065790812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,2,balanced,0.20258132616678873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,2,balanced,0.20206934213638306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,2,balanced,0.20616533358891806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,2,balanced,0.21282132466634116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,2,balanced,0.21589332818984985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,2,balanced,0.22254933913548788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,2,balanced,0.2310826579729716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,2,balanced,0.2373973329861959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,2,balanced,0.2515626748402913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,2,balanced,0.283135990301768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,2,balanced,0.30105600754419964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,2,balanced,0.34781865278879803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,2,balanced,0.40447998046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,2,balanced,0.5394773483276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,2,balanced,0.6980266571044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,2,balanced,1.107098658879598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,1,power_law_1.2,1.245798397064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,2,balanced,1.4969174067179363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,2,balanced,2.228223959604899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,2,balanced,3.0525439580281577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,1,power_law_1.2,1.6695295333862306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,1,power_law_1.2,2.5266176223754884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,1,power_law_1.2,3.3742847442626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,128,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,128,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,128,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,128,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,128,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,128,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,128,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,128,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,128,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,128,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,128,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,128,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,128,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,128,power_law_1.01,0.038489601016044615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,128,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,128,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,128,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,128,power_law_1.01,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,128,power_law_1.01,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,128,power_law_1.01,0.12513279914855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,128,power_law_1.01,0.18124799728393554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,128,power_law_1.01,0.31825919151306153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,128,power_law_1.01,0.48353281021118166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,128,power_law_1.01,0.7251967906951904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,128,power_law_1.01,0.9596927642822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,128,power_law_1.01,1.4055423736572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,128,power_law_1.01,1.9582975387573243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,2,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,2,power_law_1.2,0.1253376007080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,2,power_law_1.2,0.2676736116409302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,2,power_law_1.2,0.3952640056610107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,2,power_law_1.2,0.45055360794067384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,2,power_law_1.2,0.7427775859832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,2,power_law_1.2,0.7933951854705811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,2,power_law_1.2,0.8409088134765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,2,power_law_1.2,0.8460288047790527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,2,power_law_1.2,0.8646656036376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,2,power_law_1.2,0.8779711723327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,2,power_law_1.2,0.8929216384887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,2,power_law_1.2,0.8976384162902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,2,power_law_1.2,0.9263104438781739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,2,power_law_1.2,0.9265151977539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,2,power_law_1.2,0.9533439636230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,2,power_law_1.2,0.9545663833618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,2,power_law_1.2,1.0035200119018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,2,power_law_1.2,1.0860544204711915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,2,power_law_1.2,1.2812288284301758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,2,power_law_1.2,1.3541376113891601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,2,power_law_1.2,1.7274688720703124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,2,power_law_1.2,1.9955711364746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,2,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,2,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,2,power_law_1.01,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,2,power_law_1.01,0.20398080348968506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,2,power_law_1.01,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,2,power_law_1.01,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,2,power_law_1.2,2.635980796813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,2,power_law_1.01,0.5412864208221435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,2,power_law_1.01,0.5459968090057373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,2,power_law_1.01,0.5435391902923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,2,power_law_1.01,0.5607423782348633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,2,power_law_1.01,0.5793791770935058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,4,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,4,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,2,power_law_1.01,0.582041597366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,4,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,4,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,2,power_law_1.01,0.6285312175750732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,4,power_law_1.01,0.107315194606781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,4,power_law_1.01,0.21626880168914794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,2,power_law_1.01,0.618291187286377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,4,power_law_1.01,0.22323200702667237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,2,power_law_1.01,0.6615039825439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,4,power_law_1.01,0.22978560924530028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,2,power_law_1.01,0.6719488143920899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,4,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,2,power_law_1.01,0.6955008029937744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,4,power_law_1.01,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,4,power_law_1.01,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,2,power_law_1.01,0.7411712169647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,4,power_law_1.01,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,4,power_law_1.01,0.2371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,2,power_law_1.01,0.7968768119812012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,4,power_law_1.01,0.24576001167297362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,4,power_law_1.01,0.2500607967376709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,2,power_law_1.01,0.8560640335083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,4,power_law_1.01,0.25927679538726806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,4,power_law_1.01,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,2,power_law_1.01,0.9904128074645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,4,power_law_1.01,0.28098559379577637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,4,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,2,power_law_1.01,1.2435456275939942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,4,power_law_1.01,0.3243839979171753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,4,power_law_1.01,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,2,power_law_1.01,1.462886428833008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,4,power_law_1.01,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,2,power_law_1.2,3.1021055221557616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,4,power_law_1.01,0.6262784004211426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,2,power_law_1.01,1.944371223449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,4,power_law_1.01,0.8386560440063476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,4,power_law_1.01,1.0272768020629883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,2,power_law_1.01,2.4260608673095705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,4,power_law_1.01,1.5851519584655762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,2,power_law_1.01,3.4883583068847654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,4,power_law_1.01,2.08670711517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,2,power_law_1.01,4.306739044189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,32,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,32,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,32,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,32,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,32,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,32,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,32,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,32,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,32,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,32,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,32,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,32,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,32,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,32,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,32,balanced,0.029685333371162415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,32,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,32,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,32,balanced,0.03617066641648611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,32,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,32,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,32,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,32,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,32,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,32,balanced,0.08994133273760478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,32,balanced,0.10342400272687276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,32,balanced,0.22425599892934164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,32,balanced,0.285866657892863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,2,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,2,balanced,0.23944532871246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,2,balanced,0.4532906611760457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,2,balanced,0.8733013470967611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.5261312007904053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,2,balanced,1.712981383005778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.6995967864990235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,2,balanced,1.7215147018432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.9082880020141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,2,balanced,1.731071949005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,2,balanced,1.7382079760233562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,1,power_law_1.2,1.6889856338500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,2,balanced,1.7455627123514812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,1,power_law_1.2,1.7305599212646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,2,balanced,1.7687840461730957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,1,power_law_1.2,1.7911808013916015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,1,power_law_1.2,1.8319360733032226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,1,power_law_1.2,1.86059513092041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,2,balanced,1.7645227114359539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,1,power_law_1.2,1.885798454284668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,2,balanced,1.7754453023274739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,2,balanced,1.7882453600565593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,1,power_law_1.2,1.9306495666503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,2,balanced,1.809066613515218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,1,power_law_1.2,2.0172800064086913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,1,power_law_1.2,1.9928895950317382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,1,power_law_1.2,2.1389312744140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,2,balanced,1.8283519744873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,2,balanced,1.8513919512430828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,2,balanced,1.9005173047383626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,1,power_law_1.2,2.203014373779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,2,balanced,1.9952640533447266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,2,balanced,2.0766612688700357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,1,power_law_1.2,2.386739158630371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,2,balanced,2.1821440060933432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,2,balanced,2.324138641357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,1,power_law_1.2,2.44531192779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,2,balanced,2.566314697265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,2,balanced,2.8695894877115884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,1,power_law_1.2,2.671615982055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,2,balanced,3.650901476542155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,2,balanced,4.472832043965657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,1,power_law_1.2,3.159040069580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,2,balanced,6.459903717041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,2,balanced,8.808789571126303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,1,power_law_1.2,3.3570816040039064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,1,power_law_1.2,4.100096130371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,2,power_law_1.2,4.345651245117187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,1,power_law_1.2,4.980531311035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,1,power_law_1.2,6.507110595703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,1,power_law_1.2,7.96569595336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,1,power_law_1.2,10.737664031982423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,2,power_law_1.2,6.085427093505859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,1,power_law_1.2,13.433651733398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,4,power_law_1.01,1.0639360427856446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,4,power_law_1.01,2.0379648208618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,4,power_law_1.01,4.098867034912109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,4,power_law_1.01,4.373286437988281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,4,power_law_1.01,6.1792255401611325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,4,power_law_1.01,7.5268096923828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,4,power_law_1.01,8.349081420898438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,4,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,4,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,4,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,4,balanced,0.2754559914271037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,4,balanced,0.5403199990590414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,4,balanced,1.0369706948598225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,4,balanced,1.0446346600850422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,4,balanced,1.0484053293863933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,4,balanced,1.0507946809132893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,4,balanced,1.055573304494222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,4,balanced,1.0600106716156006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,4,power_law_1.01,9.908627319335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,4,balanced,1.07042129834493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,4,balanced,1.0753706296284993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,4,balanced,1.0876586437225342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,4,balanced,1.1054026285807292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,4,balanced,1.1180373032887776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,4,balanced,1.1446613470713298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,4,balanced,1.2153173287709553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,4,balanced,1.27129069964091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,4,balanced,1.3866666158040364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,4,power_law_1.01,10.23815689086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,1,power_law_1.2,19.641127014160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,4,balanced,1.5298560460408528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,4,balanced,1.784981409708659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,4,balanced,2.0913492838541665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,4,balanced,2.7038612365722656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,4,power_law_1.01,10.213581085205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,4,balanced,3.217066764831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,4,balanced,4.47163740793864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,4,power_law_1.01,9.195315551757812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,4,balanced,5.600597381591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,4,power_law_1.01,10.461798095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,4,power_law_1.01,9.861529541015624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,4,power_law_1.01,10.019840240478516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,4,power_law_1.01,10.571366119384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,4,power_law_1.01,10.89249267578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,4,power_law_1.01,10.891878509521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,4,power_law_1.01,11.956224060058593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,4,power_law_1.01,11.095040130615235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,4,power_law_1.01,12.855500793457031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,4,power_law_1.01,12.920013427734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,4,power_law_1.01,14.176460266113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,4,power_law_1.01,14.957568359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,4,power_law_1.01,17.415577697753907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,4,power_law_1.01,21.15625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,4,power_law_1.01,27.774151611328126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,1,power_law_1.2,25.25184020996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,4,power_law_1.01,28.21263427734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.9193471908569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,1,power_law_1.01,1.3643775939941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,1,power_law_1.01,2.3039936065673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,1,power_law_1.01,3.520102310180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,1,power_law_1.01,3.5377151489257814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.05794559717178345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.23489279747009278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.2371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,1,power_law_1.01,3.5432254791259767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.24637439250946044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.24739840030670165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.24924159049987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.2559999942779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,1,power_law_1.01,3.7318656921386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.25661439895629884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.2594815969467163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.2695168018341064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.27463679313659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,1,power_law_1.01,4.056883239746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.29531519412994384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.2994175910949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.3555327892303467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,1,power_law_1.01,4.3720703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.4098048210144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,1,power_law_1.01,4.435148620605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,1,power_law_1.01,4.157644653320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,1,power_law_1.01,4.291993713378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.5212096214294434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,1,power_law_1.01,4.630118560791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,16,power_law_1.01,1.5939583778381348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,1,power_law_1.01,5.138022232055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,16,power_law_1.01,2.066022491455078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,16,power_law_1.01,2.0658111572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,1,power_law_1.01,5.560524749755859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,16,power_law_1.01,2.1053440093994142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,16,power_law_1.01,2.050457572937012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,1,power_law_1.01,6.03504638671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,16,power_law_1.01,1.8006015777587892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,16,power_law_1.01,1.9984384536743165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,16,power_law_1.01,1.9277631759643554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,1,power_law_1.01,7.076249694824218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,16,power_law_1.01,1.9818496704101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.6701056003570557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,16,power_law_1.01,1.9101696014404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,1,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,1,balanced,0.07458133498827617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,16,power_law_1.01,1.8786304473876954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,16,power_law_1.01,1.9484607696533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,1,power_law_1.01,8.25528335571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,16,power_law_1.01,1.9208192825317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,1,balanced,0.28996266921361286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,1,balanced,0.5370879968007406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,1,balanced,1.037823994954427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,16,power_law_1.01,2.011750411987305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,1,balanced,2.025813261667887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,1,balanced,2.037247975667318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,16,power_law_1.01,2.0590591430664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,1,balanced,2.0387840270996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,16,power_law_1.01,2.028544044494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,1,balanced,2.053973356882731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,1,balanced,2.0648959477742515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,16,power_law_1.01,2.088345527648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,1,balanced,2.0870827039082847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,1,power_law_1.01,1.0276864051818848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,1,balanced,2.111658732096354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,16,power_law_1.01,2.1385215759277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,1,balanced,2.1331626574198403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,1,balanced,2.1746346155802407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,16,power_law_1.01,2.225356864929199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,1,balanced,2.2198613484700522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,1,power_law_1.01,9.385369873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,1,balanced,2.264063994089762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,16,power_law_1.01,2.5389055252075194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,1,balanced,2.3381333351135254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,16,power_law_1.01,2.9038591384887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,1,balanced,2.497536023457845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,1,balanced,2.6613759994506836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,16,power_law_1.01,3.3339393615722654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,1,balanced,3.0057814915974936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,1,balanced,3.394048055013021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,16,power_law_1.01,3.7512897491455077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,1,balanced,4.12552547454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,1,balanced,4.769791920979817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,16,power_law_1.01,4.4886016845703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,1,power_law_1.01,10.894950103759765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,1,balanced,6.140586853027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,16,power_law_1.01,5.579776000976563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,1,balanced,7.638869603474935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,1,power_law_1.01,1.399398422241211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,16,power_law_1.01,7.9298561096191404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,1,balanced,10.672810872395834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,1,power_law_1.01,12.634317016601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,16,power_law_1.01,9.811353302001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,1,balanced,13.635242462158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,1,power_law_1.01,2.081177520751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,1,power_law_1.01,15.852339172363282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,1,power_law_1.01,18.773196411132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,1,power_law_1.01,2.7674623489379884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,1,power_law_1.01,24.8453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,1,power_law_1.01,30.54735412597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,1,power_law_1.01,4.12487678527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,1,power_law_1.01,41.0355712890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,8,power_law_1.01,0.32870399951934814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,16,power_law_1.2,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,8,power_law_1.01,0.5437439918518067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,16,power_law_1.2,0.5244927883148194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,8,power_law_1.01,0.6594560146331787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,16,power_law_1.2,0.5363711833953857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,8,power_law_1.01,0.830668830871582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,16,power_law_1.2,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,8,power_law_1.01,0.8749055862426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,16,power_law_1.2,0.5523136138916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,8,power_law_1.01,0.8658944129943847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,16,power_law_1.2,0.4997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,8,power_law_1.01,0.9113599777221679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,16,power_law_1.2,0.48824319839477537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,8,power_law_1.01,0.8904512405395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,16,power_law_1.2,0.5119999885559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,8,power_law_1.01,0.9674495697021485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,16,power_law_1.2,0.5251071929931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,8,power_law_1.01,0.9361408233642579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,16,power_law_1.2,0.5443520069122314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,8,power_law_1.01,0.8712191581726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,16,power_law_1.2,0.5175295829772949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,8,power_law_1.01,0.9048064231872559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,16,power_law_1.2,0.5310463905334473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,8,power_law_1.01,0.9433088302612305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,16,power_law_1.2,0.5390079975128174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,8,power_law_1.01,1.0168319702148438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,16,power_law_1.2,0.5478400230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,8,power_law_1.01,0.9664511680603027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,16,power_law_1.2,0.5890048027038575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,8,power_law_1.01,1.0645503997802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,16,power_law_1.2,0.5658624172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,8,power_law_1.01,1.0762240409851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,16,power_law_1.2,0.6141952037811279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,8,power_law_1.01,1.1233280181884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,16,power_law_1.2,0.6328320026397705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,8,power_law_1.01,1.1960320472717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,16,power_law_1.2,0.7002111911773682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,8,power_law_1.01,1.2922880172729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,16,power_law_1.2,0.8110079765319824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,16,power_law_1.2,1.0205183982849122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,8,power_law_1.01,1.4098431587219238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,16,power_law_1.2,1.242086410522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,8,power_law_1.01,1.6041984558105469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,16,power_law_1.2,1.4915583610534668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,8,power_law_1.01,1.9167232513427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,8,power_law_1.01,2.5200639724731446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,16,power_law_1.2,2.063360023498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,8,power_law_1.01,3.1879167556762695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,16,power_law_1.2,2.650111961364746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,8,power_law_1.01,4.738662338256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,16,power_law_1.2,4.027187347412109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,8,power_law_1.01,5.653299331665039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,16,power_law_1.2,5.082521438598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,1,power_law_1.01,5.501747131347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,8,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,8,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,8,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,8,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,8,power_law_1.2,0.031097599864006044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,8,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,8,power_law_1.2,0.032339200377464294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,8,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,8,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,8,power_law_1.2,0.03623040020465851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,8,power_law_1.2,0.039929598569869995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,8,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,8,power_law_1.2,0.05139200091361999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,8,power_law_1.2,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,8,power_law_1.2,0.08212479948997498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,8,power_law_1.2,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,8,power_law_1.2,0.12349439859390259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,8,power_law_1.2,0.1341312050819397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,8,power_law_1.2,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,1,power_law_1.01,52.05770263671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,8,power_law_1.2,0.3166208028793335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,8,power_law_1.2,0.48762879371643064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,8,power_law_1.2,0.6209536075592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,8,power_law_1.2,1.04017915725708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,8,power_law_1.2,1.4405632019042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,16,power_law_1.01,0.5988287925720215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,16,power_law_1.01,1.0571776390075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,16,power_law_1.01,1.041811180114746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,16,power_law_1.01,1.0526720046997071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,16,power_law_1.01,1.0385408401489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,16,power_law_1.01,0.9431039810180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,16,power_law_1.01,0.9082880020141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,16,power_law_1.01,0.8626175880432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,16,power_law_1.01,0.8257535934448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,16,power_law_1.01,0.8437760353088379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,16,power_law_1.01,0.9730048179626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,16,power_law_1.01,1.0188799858093263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,16,power_law_1.01,0.9375743865966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,16,power_law_1.01,1.0592255592346191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,16,power_law_1.01,0.9869312286376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,16,power_law_1.01,1.0194944381713866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,16,power_law_1.01,1.0620927810668945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,16,power_law_1.01,1.123532772064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,16,power_law_1.01,1.2093440055847169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,16,power_law_1.01,1.273855972290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,4,power_law_1.2,0.35450880527496337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,4,power_law_1.2,0.6752255916595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,16,power_law_1.01,1.3950976371765136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,4,power_law_1.2,0.7458816051483155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,16,power_law_1.01,1.6736255645751954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,4,power_law_1.2,1.0747903823852538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,4,power_law_1.2,1.2552191734313964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,16,power_law_1.01,2.092032051086426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,4,power_law_1.2,1.4741503715515136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,16,power_law_1.01,2.77258243560791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,4,power_law_1.2,2.127257537841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,4,power_law_1.2,2.152243232727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,16,power_law_1.01,3.175424003601074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,4,power_law_1.2,2.106163215637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,4,power_law_1.2,1.9611583709716798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,16,power_law_1.01,4.2340351104736325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,4,power_law_1.2,2.091417694091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,4,power_law_1.2,2.2358015060424803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,16,power_law_1.01,5.874483108520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,4,power_law_1.2,2.3459840774536134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,4,power_law_1.2,2.2575103759765627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,4,power_law_1.2,2.3597055435180665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,4,power_law_1.2,2.408243179321289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,4,power_law_1.2,2.4666112899780273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,4,power_law_1.2,2.609561538696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,4,power_law_1.2,2.718720054626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,4,power_law_1.2,2.916761589050293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,4,power_law_1.2,3.210854339599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,4,power_law_1.2,3.8443008422851563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,4,power_law_1.2,4.347699356079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,8,power_law_1.2,2.2962175369262696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,4,power_law_1.2,5.179379272460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,4,power_law_1.2,5.726003265380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,4,power_law_1.2,7.909990692138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,32,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,32,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,32,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,32,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,4,power_law_1.2,11.158118438720702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,32,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,32,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,32,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,32,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,32,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,32,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,32,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,32,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,32,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,32,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,32,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,32,power_law_1.01,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,32,power_law_1.01,0.10076160430908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,32,power_law_1.01,0.1415168046951294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,32,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,32,power_law_1.01,0.27112319469451907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,32,power_law_1.01,0.38461439609527587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,32,power_law_1.01,0.5033984184265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,32,power_law_1.01,0.7725056171417236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,32,power_law_1.01,1.207705593109131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,32,power_law_1.01,1.746944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,32,power_law_1.01,2.5016319274902346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,8,power_law_1.2,3.1551488876342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,4,power_law_1.2,0.15708160400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,4,power_law_1.2,0.14295040369033812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,4,power_law_1.2,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,4,power_law_1.2,0.2744319915771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,4,power_law_1.2,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,4,power_law_1.2,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,4,power_law_1.2,0.28280959129333494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,4,power_law_1.2,0.2869055986404419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,4,power_law_1.2,0.28815360069274903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,4,power_law_1.2,0.28733439445495607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,4,power_law_1.2,0.3104768037796021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,4,power_law_1.2,0.32030720710754396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,4,power_law_1.2,0.33216640949249265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,4,power_law_1.2,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,4,power_law_1.2,0.41451520919799806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,4,power_law_1.2,0.4247551918029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,4,power_law_1.2,0.4612095832824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,4,power_law_1.2,0.5451776027679444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,4,power_law_1.2,0.8060928344726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,4,power_law_1.2,1.0860544204711915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,4,power_law_1.2,1.2681216239929198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,4,power_law_1.2,2.029363250732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,4,power_law_1.01,0.8208383560180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,4,power_law_1.01,1.437491226196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,4,power_law_1.01,1.4528512001037597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,4,power_law_1.01,1.988198471069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,4,power_law_1.01,2.4381439208984377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,4,power_law_1.01,3.4111488342285154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,4,power_law_1.01,3.542220687866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,4,power_law_1.01,3.3538047790527346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,4,power_law_1.01,3.406438446044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,4,power_law_1.01,3.4721790313720704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,4,power_law_1.01,3.566796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,4,power_law_1.2,2.581504058837891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,4,power_law_1.01,3.7793792724609374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,4,power_law_1.01,3.8735870361328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,4,power_law_1.01,3.7994495391845704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,4,power_law_1.01,3.863961410522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,4,power_law_1.01,3.969843292236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,4,power_law_1.01,4.027596664428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,4,power_law_1.01,4.276224136352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,4,power_law_1.01,4.426342391967774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,4,power_law_1.01,4.782694244384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,4,power_law_1.01,5.436825561523437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,4,power_law_1.01,6.235136032104492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,4,power_law_1.01,7.115756988525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,4,power_law_1.01,8.91883544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,4,power_law_1.01,10.212761688232423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,4,power_law_1.01,14.009957885742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,4,power_law_1.2,3.661004638671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,4,power_law_1.01,17.685299682617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,8,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,8,balanced,0.1868799924850464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,8,balanced,0.2524159948031108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,8,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,8,balanced,0.2529279987017314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,8,balanced,0.25361067056655884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,8,balanced,0.25497599442799884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,8,balanced,0.2558293342590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,8,balanced,0.2577066620190938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,8,balanced,0.2585600018501282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,8,balanced,0.26077866554260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,8,balanced,0.26470400889714557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,8,balanced,0.26692267258961994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,8,balanced,0.27084799607594806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,8,balanced,0.26999467611312866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,8,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,8,balanced,0.29661866029103595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,8,balanced,0.32102400064468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,8,balanced,0.34508800506591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,8,balanced,0.3742719888687134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,8,balanced,0.4483413298924764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,8,balanced,0.5423786640167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,8,balanced,0.7978666623433431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,8,balanced,1.040554682413737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,1,balanced,0.2573653260866801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,1,balanced,0.44697598616282147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,1,balanced,0.8780746459960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,1,balanced,1.7225066820780437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,1,balanced,3.404965400695801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,1,balanced,3.4182507197062173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,1,balanced,3.429546674092611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,1,balanced,3.4416640599568686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,1,balanced,3.452416102091471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,1,balanced,3.4658985137939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,1,balanced,3.490133285522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,1,balanced,3.524949391682943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,1,balanced,3.5479892094930015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,1,balanced,3.590826670328776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,1,balanced,3.724954605102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,4,power_law_1.2,4.710176086425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,1,balanced,3.7606401443481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,1,balanced,3.8427305221557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,1,balanced,3.8741067250569663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,1,balanced,4.127231915791829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,1,balanced,4.287317276000977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,1,balanced,4.538026809692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,1,balanced,5.131775856018066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,1,balanced,5.657237370808919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,1,balanced,7.255893071492513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,1,balanced,9.243978500366211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,1,balanced,12.930901845296225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,1,balanced,17.32317860921224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,2,power_law_1.01,0.4622335910797119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,2,power_law_1.01,0.546611213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,2,power_law_1.01,0.5666816234588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,2,power_law_1.01,0.8462335586547851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,2,power_law_1.01,0.8886207580566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,2,power_law_1.01,0.8960000038146972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,2,power_law_1.01,0.901529598236084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,2,power_law_1.01,0.9060352325439454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,2,power_law_1.01,0.9185279846191406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,2,power_law_1.01,0.9515007972717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,2,power_law_1.01,1.0184576034545898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,2,power_law_1.01,1.0676223754882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,2,power_law_1.01,1.146675205230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,2,power_law_1.01,1.0967040061950684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,2,power_law_1.01,1.2292096138000488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,2,power_law_1.01,1.2486656188964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,2,power_law_1.01,1.3936639785766602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,2,power_law_1.01,1.6959487915039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,2,power_law_1.01,2.066431999206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,2,power_law_1.01,2.610585594177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,1,power_law_1.2,0.2959359884262085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,1,power_law_1.2,0.5056511878967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,1,power_law_1.2,0.5539840221405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,2,power_law_1.01,3.181772804260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,1,power_law_1.2,0.9967616081237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,1,power_law_1.2,0.9777152061462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,1,power_law_1.2,1.011507225036621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,1,power_law_1.2,1.042841625213623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,1,power_law_1.2,1.0483712196350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,1,power_law_1.2,1.0614656448364257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,1,power_law_1.2,1.0463232040405273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,1,power_law_1.2,1.0844032287597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,1,power_law_1.2,1.1118592262268066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,1,power_law_1.2,1.1347840309143067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,1,power_law_1.2,1.1784192085266114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,1,power_law_1.2,1.2560192108154298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,1,power_law_1.2,1.2824576377868653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,4,power_law_1.2,6.144204711914062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,1,power_law_1.2,1.3621248245239257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,1,power_law_1.2,1.6070655822753905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,1,power_law_1.2,1.8302976608276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,2,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,2,balanced,0.045909335215886436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,2,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,2,balanced,0.08243200182914734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,2,balanced,0.3054666717847188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,2,balanced,0.37700267632802326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,1,power_law_1.2,2.328166389465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,2,balanced,0.38075733184814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,2,power_law_1.01,4.516864013671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,2,balanced,0.38075733184814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,2,balanced,0.38656000296274823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,2,balanced,0.38980265458424884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,2,balanced,0.3996959924697876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,2,balanced,0.4068693319956462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,2,balanced,0.4135253429412842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,2,balanced,0.42581331729888916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,2,balanced,0.4432213306427002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,2,balanced,0.45602134863535565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,2,balanced,0.48315731684366864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,2,balanced,0.5362346569697062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,2,balanced,0.5920426845550537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,2,balanced,0.7256746292114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,2,balanced,0.8978772958119711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,2,balanced,1.2540586789449055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,2,balanced,1.5719839731852214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,2,balanced,2.238096078236898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,2,balanced,2.9356374740600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,2,balanced,4.394826571146647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,2,balanced,5.859498977661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,1,power_law_1.2,2.8854272842407225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,2,power_law_1.01,5.617459106445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,1,power_law_1.2,3.7926910400390623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,1,power_law_1.2,4.7757312774658205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,2,power_law_1.01,7.563673400878907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,4,power_law_1.2,8.631501007080079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,1,power_law_1.2,6.626303863525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,2,power_law_1.01,11.058380889892579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,128,power_law_1.2,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,128,power_law_1.2,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,128,power_law_1.2,0.28487679958343504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,128,power_law_1.2,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,128,power_law_1.2,0.24944639205932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,128,power_law_1.2,0.2520895957946777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,128,power_law_1.2,0.29180159568786623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,128,power_law_1.2,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,128,power_law_1.2,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,128,power_law_1.2,0.2959359884262085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,128,power_law_1.2,0.29818880558013916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,128,power_law_1.2,0.3028863906860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,128,power_law_1.2,0.30453760623931886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,128,power_law_1.2,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,128,power_law_1.2,0.3190464019775391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,128,power_law_1.2,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,128,power_law_1.2,0.342630410194397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,128,power_law_1.2,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,128,power_law_1.2,0.5322751998901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,128,power_law_1.2,0.7542784214019775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,128,power_law_1.2,0.9605119705200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,128,power_law_1.2,1.45797119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,128,power_law_1.2,2.1360639572143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,128,power_law_1.2,2.816819190979004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,128,power_law_1.2,4.352204895019531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,128,power_law_1.2,6.512025451660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,128,power_law_1.2,8.614502716064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,2,power_law_1.01,14.523802185058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,1,power_law_1.2,9.208422088623047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,2,power_law_1.01,19.847576904296876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,2,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,2,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,2,power_law_1.01,0.1325055956840515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,2,power_law_1.01,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,2,power_law_1.01,0.3096447944641113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,4,power_law_1.2,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,2,power_law_1.01,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,2,power_law_1.01,0.42352638244628904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,4,power_law_1.2,0.3213248014450073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,2,power_law_1.01,0.4143104076385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,2,power_law_1.01,0.4380671977996826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,4,power_law_1.2,0.393830394744873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,4,power_law_1.2,0.5351424217224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,4,power_law_1.2,0.6449151992797851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,2,power_law_1.01,0.42905597686767577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,2,power_law_1.01,0.4433919906616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,4,power_law_1.2,0.9711615562438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,2,power_law_1.01,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,2,power_law_1.01,0.4521984100341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,4,power_law_1.2,0.9121791839599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,2,power_law_1.01,0.4722559928894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,2,power_law_1.01,0.4863999843597412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,4,power_law_1.2,0.9207807540893554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,2,power_law_1.01,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,4,power_law_1.2,0.941260814666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,2,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,2,power_law_1.01,0.5320703983306885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,4,power_law_1.2,0.9310208320617676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,2,power_law_1.01,0.5652480125427246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,2,power_law_1.01,0.6486015796661377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,4,power_law_1.2,0.9586688041687011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,2,power_law_1.01,0.692633581161499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,4,power_law_1.2,0.9791359901428223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,2,power_law_1.01,0.8941568374633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,4,power_law_1.2,1.0053631782531738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,2,power_law_1.01,1.0684415817260742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,4,power_law_1.2,1.053286361694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,2,power_law_1.01,1.5015935897827148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,4,power_law_1.2,1.0999808311462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,2,power_law_1.01,1.879859161376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,4,power_law_1.2,1.1132927894592286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,4,power_law_1.2,1.1870207786560059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,2,power_law_1.01,2.6595327377319338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,4,power_law_1.2,1.267916774749756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,2,power_law_1.01,3.3699840545654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,4,power_law_1.2,1.375436782836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,4,power_law_1.2,1.6097280502319335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,4,power_law_1.2,1.8251775741577148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,4,power_law_1.2,2.2329343795776366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,4,power_law_1.2,2.6060800552368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,4,power_law_1.2,3.597516632080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,4,power_law_1.2,4.334796905517578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,4,power_law_1.2,6.4090110778808596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,1,power_law_1.2,13.184614562988282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,4,power_law_1.2,7.995801544189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,2,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,2,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,2,power_law_1.01,0.0899071991443634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,2,power_law_1.01,0.18309119939804078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,2,power_law_1.01,0.24412159919738768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,2,power_law_1.01,0.3962496042251587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,2,power_law_1.01,0.40446081161499026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,2,power_law_1.01,0.4216832160949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,2,power_law_1.01,0.4526080131530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,2,power_law_1.01,0.44417920112609866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,2,power_law_1.01,0.4657087802886963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,2,power_law_1.01,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,2,power_law_1.01,0.48496642112731936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,2,power_law_1.01,0.4907008171081543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,2,power_law_1.01,0.5101568222045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,2,power_law_1.01,0.5252863883972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,2,power_law_1.01,0.5373695850372314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,2,power_law_1.01,0.6025216102600097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,2,power_law_1.01,0.6334464073181152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,2,power_law_1.01,0.7626751899719239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,2,power_law_1.01,0.9899904251098632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,2,power_law_1.01,1.3338624000549317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,2,power_law_1.01,1.580031967163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,2,power_law_1.01,2.16494083404541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,2,power_law_1.01,2.7222015380859377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,2,power_law_1.01,4.185907363891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,2,power_law_1.01,5.917900848388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,1,power_law_1.2,17.013555908203124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,2,power_law_1.01,0.6008831977844238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,2,power_law_1.01,1.055731201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,2,power_law_1.01,1.4354432106018067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,2,power_law_1.01,2.513510322570801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,2,power_law_1.01,3.6831039428710937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,2,power_law_1.01,4.652441787719726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,2,power_law_1.01,6.427033233642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,2,power_law_1.01,5.9870849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,2,power_law_1.01,6.942105865478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,2,power_law_1.01,7.115570831298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,2,power_law_1.01,6.70044174194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,2,power_law_1.01,6.866738891601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,2,power_law_1.01,7.067436981201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,2,power_law_1.01,7.0344703674316404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,2,power_law_1.01,7.3135932922363285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,2,power_law_1.01,7.598284912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,2,power_law_1.01,7.40679702758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,2,power_law_1.01,8.077311706542968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,2,power_law_1.01,8.2384765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,2,power_law_1.01,8.715878295898438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,2,power_law_1.01,8.980480194091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,2,power_law_1.01,10.361650848388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,2,power_law_1.01,11.262566375732423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,2,power_law_1.01,13.717298889160157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,2,power_law_1.01,17.361509704589842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,16,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,16,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,16,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,16,balanced,0.23944532871246338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,16,balanced,0.457045316696167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,16,balanced,0.4561920166015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,16,balanced,0.4580693244934082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,16,balanced,0.45875199635823566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,16,balanced,0.46113598346710205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,16,balanced,0.4613120158513387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,16,balanced,0.46404266357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,16,balanced,0.46693865458170575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,16,balanced,0.46882132689158124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,16,balanced,0.47274665037790936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,16,balanced,0.48298664887746173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,16,balanced,0.48469332853953045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,16,balanced,0.4922026793162028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,16,balanced,0.48655466238657635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,16,balanced,0.5111466646194458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,16,balanced,0.5521066586176554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,16,balanced,0.5708800156911215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,16,balanced,0.6335146824518839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,16,balanced,0.6756693522135416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,16,balanced,0.8736426830291748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,16,balanced,1.0716160138448079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,16,balanced,1.6223573684692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,2,power_law_1.01,21.80034484863281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,16,balanced,2.1637120246887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,2,power_law_1.01,26.441726684570312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,2,power_law_1.2,0.8355839729309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,2,power_law_1.2,1.2156928062438965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,2,power_law_1.2,1.8966527938842774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,2,power_law_1.2,2.7635711669921874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,2,power_law_1.2,3.868057632446289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,2,power_law_1.2,6.411878204345703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,2,power_law_1.2,6.2500862121582035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,2,power_law_1.2,6.936166381835937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,2,power_law_1.2,6.9863426208496096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,2,power_law_1.2,7.340236663818359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,2,power_law_1.2,7.432396697998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,2,power_law_1.2,7.445491027832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,2,power_law_1.2,7.79345932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,2,power_law_1.2,8.08980484008789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,2,power_law_1.2,8.450662231445312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,2,power_law_1.2,8.473190307617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,2,power_law_1.2,8.930303955078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,2,power_law_1.2,8.742912292480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,2,power_law_1.2,9.514598083496093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,2,power_law_1.2,9.789234924316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,2,power_law_1.2,10.592870330810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,2,power_law_1.2,12.884991455078126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,2,power_law_1.2,13.247283935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,2,power_law_1.2,17.06946563720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,16,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,16,power_law_1.01,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,2,power_law_1.2,19.621682739257814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,16,power_law_1.01,0.2883519887924194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,16,power_law_1.01,0.27648000717163085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,16,power_law_1.01,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,16,power_law_1.01,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,16,power_law_1.01,0.26562559604644775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,16,power_law_1.01,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,16,power_law_1.01,0.26439681053161623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,16,power_law_1.01,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,16,power_law_1.01,0.2703360080718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,16,power_law_1.01,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,16,power_law_1.01,0.2789376020431519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,16,power_law_1.01,0.29921278953552244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,16,power_law_1.01,0.3172352075576782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,16,power_law_1.01,0.31436800956726074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,16,power_law_1.01,0.3264512062072754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,16,power_law_1.01,0.3565567970275879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,16,power_law_1.01,0.38645761013031005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,16,power_law_1.01,0.4550528049468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,16,power_law_1.01,0.4958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,16,power_law_1.01,0.6203392028808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,16,power_law_1.01,0.8062975883483887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,16,power_law_1.01,1.085638427734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,8,power_law_1.2,0.7520063877105713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,2,power_law_1.2,27.665408325195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,16,power_law_1.01,1.5163392066955566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,8,power_law_1.2,1.116160011291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,8,power_law_1.2,1.202175998687744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,16,power_law_1.01,2.310348892211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,8,power_law_1.2,1.508556842803955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,16,power_law_1.01,3.2923648834228514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,8,power_law_1.2,1.8130943298339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,8,power_law_1.2,1.7582080841064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,8,power_law_1.2,1.660108757019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,8,power_law_1.2,1.7541120529174805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,8,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,8,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,8,power_law_1.2,1.8595455169677735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,8,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,8,power_law_1.01,0.06369280219078063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,8,power_law_1.2,1.927168083190918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,8,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,8,power_law_1.2,1.9189632415771485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,8,power_law_1.2,1.8495487213134765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,8,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,8,power_law_1.01,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,8,power_law_1.2,1.9617792129516602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,8,power_law_1.01,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,8,power_law_1.01,0.06878719925880432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,8,power_law_1.2,2.029567909240723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,8,power_law_1.01,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,8,power_law_1.01,0.07679359912872315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,8,power_law_1.2,2.0553407669067383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,8,power_law_1.01,0.08024320006370544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,8,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,8,power_law_1.01,0.08885120153427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,8,power_law_1.2,2.0895551681518554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,8,power_law_1.01,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,8,power_law_1.01,0.10629119873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,8,power_law_1.2,2.106163215637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,8,power_law_1.01,0.11735039949417114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,8,power_law_1.01,0.17612799406051635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,8,power_law_1.01,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,8,power_law_1.2,2.2957952499389647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,8,power_law_1.01,0.24821760654449462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,8,power_law_1.01,0.3438591957092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,8,power_law_1.2,2.370560073852539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,8,power_law_1.01,0.5482495784759521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,8,power_law_1.01,0.7646975994110108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,8,power_law_1.2,2.771558380126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,8,power_law_1.01,1.3273088455200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,8,power_law_1.2,2.962841606140137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,2,power_law_1.2,32.517529296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,8,power_law_1.01,1.8362367630004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,8,power_law_1.2,3.6550655364990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,8,power_law_1.01,2.6785791397094725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,8,power_law_1.01,3.5383296966552735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,8,power_law_1.2,4.378182220458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,8,power_law_1.2,5.634867095947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,8,power_law_1.2,6.239231872558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,8,power_law_1.2,8.976793670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,8,power_law_1.2,11.0202880859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,64,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,64,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,64,power_law_1.01,0.026412799954414368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,64,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,64,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,64,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,64,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,64,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,64,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,64,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,64,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,64,power_law_1.01,0.039110401272773744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,64,power_law_1.01,0.04791040122509003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,64,power_law_1.01,0.05139840245246887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,64,power_law_1.01,0.078438401222229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,64,power_law_1.01,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,64,power_law_1.01,0.16506880521774292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,64,power_law_1.01,0.2756608009338379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,64,power_law_1.01,0.40919041633605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,64,power_law_1.01,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,64,power_law_1.01,0.9285632133483886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,64,power_law_1.01,1.2496895790100098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.5269504070281983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.8785920143127441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,2,1,power_law_1.01,1.0799103736877442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,2,1,power_law_1.01,1.927168083190918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,2,1,power_law_1.01,2.027315139770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,2,1,power_law_1.01,2.047590446472168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,2,1,power_law_1.01,2.0379648208618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,2,1,power_law_1.01,2.3214080810546873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,2,1,power_law_1.01,2.349260711669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,2,1,power_law_1.01,2.4551424026489257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,2,1,power_law_1.01,2.372198486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,2,1,power_law_1.01,2.4719295501708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,2,1,power_law_1.01,2.5206720352172853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,2,1,power_law_1.01,2.7303936004638674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,2,1,power_law_1.01,2.895462417602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,2,1,power_law_1.01,2.9566976547241213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,2,1,power_law_1.01,3.3353729248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,2,1,power_law_1.01,3.9012351989746095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,2,1,power_law_1.01,4.1299903869628904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,2,1,power_law_1.01,5.047296142578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,2,1,power_law_1.01,5.897216033935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,2,1,power_law_1.01,7.634329223632813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,2,1,power_law_1.01,9.066291046142577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,2,1,power_law_1.01,12.339814758300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,2,1,power_law_1.01,15.552102661132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,16,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,16,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,16,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,16,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,16,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,16,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,16,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,16,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,16,power_law_1.2,0.028652799129486085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,16,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,16,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,16,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,16,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,16,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,16,power_law_1.2,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,16,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,16,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,16,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,16,power_law_1.2,0.0997376024723053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,16,power_law_1.2,0.11530239582061767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,16,power_law_1.2,0.1845247983932495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,16,power_law_1.2,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,2,1,power_law_1.01,21.987942504882813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,16,power_law_1.2,0.3884927988052368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,16,power_law_1.2,0.5683199882507324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,2,1,power_law_1.01,28.557516479492186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,2,power_law_1.01,0.3772416114807129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,2,power_law_1.01,0.5617663860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,2,power_law_1.01,0.6497983932495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,2,power_law_1.01,0.908083152770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,2,power_law_1.01,0.9070591926574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,2,power_law_1.01,0.917081642150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,2,power_law_1.01,0.9259008407592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,2,power_law_1.01,0.9648127555847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,2,power_law_1.01,0.982630443572998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,2,power_law_1.01,0.9666560173034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,2,power_law_1.01,0.9777152061462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,2,power_law_1.01,1.0981375694274902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,2,power_law_1.01,1.1081472396850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,2,power_law_1.01,1.2281855583190917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,2,power_law_1.01,1.3735936164855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,2,power_law_1.01,1.3520895957946777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,16,power_law_1.2,0.8665087699890137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,2,power_law_1.01,1.5597567558288574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,2,power_law_1.01,1.8548736572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,2,power_law_1.01,2.1477376937866213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,2,power_law_1.01,2.4242176055908202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,8,power_law_1.2,0.4392831802368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,8,power_law_1.2,0.530841588973999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,8,power_law_1.2,0.628326416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,8,power_law_1.2,0.8128512382507325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,8,power_law_1.2,0.8753151893615723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,8,power_law_1.2,1.0487615585327148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,8,power_law_1.2,0.9365504264831543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,8,power_law_1.2,0.9170944213867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,8,power_law_1.2,0.9144319534301758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,8,power_law_1.2,0.9891839981079101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,8,power_law_1.2,0.994099235534668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,8,power_law_1.2,0.9660415649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,8,power_law_1.2,1.0035200119018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,2,power_law_1.01,2.7248640060424805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,8,power_law_1.2,1.0676223754882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,8,power_law_1.2,1.0342399597167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,8,power_law_1.2,1.1196415901184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,8,power_law_1.2,1.1493375778198243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,8,power_law_1.2,1.2109824180603028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,8,power_law_1.2,1.2834815979003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,8,power_law_1.2,1.5155200004577636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,2,power_law_1.01,4.392140960693359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,8,power_law_1.2,1.6123775482177733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,8,power_law_1.2,2.023833656311035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,8,power_law_1.2,2.575155258178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,8,power_law_1.2,3.2858112335205076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,1,balanced,0.5920426845550537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,1,balanced,1.0337013403574626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,1,balanced,2.024277369181315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,8,power_law_1.2,4.018790435791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,1,balanced,4.039679845174153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,1,balanced,7.963306427001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,2,power_law_1.01,5.6735679626464846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,1,balanced,15.861077626546225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,8,power_law_1.2,5.795020675659179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,1,balanced,23.755775451660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,1,balanced,23.77728017171224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,64,balanced,0.05187733471393585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,64,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,64,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,64,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,2,power_law_1.01,6.928998565673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,64,balanced,0.054272000988324486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,64,balanced,0.29781333605448407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,8,power_law_1.2,7.9808509826660154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,64,balanced,0.3002026677131653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,64,balanced,0.3017386595408122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,64,balanced,0.303439994653066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,64,balanced,0.30460800727208454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,64,balanced,0.30719999472300213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,64,balanced,0.31010133028030396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,64,balanced,0.3128319978713989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,64,balanced,0.3187999924023946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,64,balanced,0.32614399989446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,64,balanced,0.3319466710090637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,64,balanced,0.34355199337005615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,64,balanced,0.36232535044352215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,64,balanced,0.3862186670303345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,64,balanced,0.43008001645406085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,64,balanced,0.47257598241170246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,1,balanced,23.818751017252605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,64,balanced,0.556714653968811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,64,balanced,0.6219093402226766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,64,balanced,0.7906986872355143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,64,balanced,1.0342400074005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,64,balanced,1.4994773864746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,64,balanced,1.9985067049662273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,1,balanced,23.850496927897137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,2,power_law_1.01,10.178969573974609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,1,balanced,23.901865641276043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,1,balanced,23.948628743489582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,16,power_law_1.2,1.4911487579345704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,1,balanced,23.995221455891926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,1,balanced,24.09386698404948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,32,balanced,0.022869333624839783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,32,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,32,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,32,balanced,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,32,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,32,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,32,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,32,balanced,0.025087999800841015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,32,balanced,0.025242666403452556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,32,balanced,0.025258667767047882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,32,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,1,balanced,24.194196065266926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,32,balanced,0.02643733223279317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,32,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,32,balanced,0.027290667096773785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,32,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,32,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,32,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,32,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,32,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,32,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,32,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,32,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,32,balanced,0.07458133498827617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,32,balanced,0.12970667084058127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,32,balanced,0.2230613430341085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,32,balanced,0.3442346652348836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,32,balanced,0.46916266282399494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,1,balanced,24.2698237101237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,1,balanced,24.44373321533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,1,balanced,24.752980550130207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,1,balanced,25.865033467610676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,1,balanced,26.45128122965495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,2,power_law_1.01,14.470553588867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,1,balanced,27.180030822753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,1,balanced,28.43408966064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,1,balanced,47.82096862792969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,16,power_law_1.2,0.601087999343872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,16,power_law_1.2,1.0571776390075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,16,power_law_1.2,1.4962688446044923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,16,power_law_1.2,1.5394816398620605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,16,power_law_1.2,1.5583231925964356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,16,power_law_1.2,1.3832192420959473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,16,power_law_1.2,1.4110719680786132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,1,balanced,36.62370045979818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,16,power_law_1.2,1.4014464378356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,16,power_law_1.2,1.113907241821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,16,power_law_1.2,1.1304960250854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,16,power_law_1.2,1.2093440055847169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,16,power_law_1.2,1.384447956085205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,16,power_law_1.2,1.2652544021606444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,16,power_law_1.2,1.4555135726928712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,16,power_law_1.2,1.2548095703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,16,power_law_1.2,1.3928447723388673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,16,power_law_1.2,1.5165439605712892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,1,balanced,32.59015401204427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,16,power_law_1.2,1.4659584045410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,16,power_law_1.2,1.6050176620483398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,16,power_law_1.2,1.8290687561035157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,16,power_law_1.2,1.7893375396728515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,16,power_law_1.2,2.2179840087890623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,2,power_law_1.01,16.340992736816407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,16,power_law_1.2,2.7439104080200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,16,power_law_1.2,3.6259838104248048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,16,power_law_1.2,4.643014526367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,1,balanced,42.022911071777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,16,power_law_1.2,6.0727294921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,16,power_law_1.2,7.540326690673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,1,balanced,42.48405456542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,8,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,8,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,8,balanced,0.2874026695887248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,8,balanced,0.5396480162938436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,8,balanced,1.0419092973073323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,8,balanced,2.0107946395874023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,8,balanced,2.0159145991007485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,8,balanced,2.0208640098571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,8,balanced,2.0261546770731607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,8,balanced,2.0440746943155923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,8,balanced,2.0355307261149087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,8,balanced,2.045952002207438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,8,balanced,2.0529492696126304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,8,balanced,2.0662612915039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,8,balanced,2.0826452573140464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,8,balanced,2.0998826026916504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,8,balanced,2.1215573946634927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,8,balanced,2.1690026919047036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,8,balanced,2.21781333287557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,8,balanced,2.303658644358317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,8,balanced,2.4072532653808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,8,balanced,2.590720017751058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,8,balanced,2.7607040405273438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,8,balanced,3.095893224080404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,8,balanced,3.584170659383138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,8,balanced,4.948309262593587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,8,balanced,6.393514633178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,2,balanced,0.5533013343811035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,2,balanced,1.0362880229949951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,2,balanced,1.0031786759694417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,2,balanced,2.044245402018229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,2,balanced,1.8082133928934734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,2,balanced,2.0940799713134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,2,balanced,2.049509366353353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,2,balanced,3.5085652669270835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,2,balanced,2.057216008504232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,2,balanced,3.5795628229777017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,2,balanced,2.0826452573140464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,2,balanced,3.504298528035482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,2,balanced,2.094762643178304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,2,balanced,3.5131734212239585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,2,balanced,2.125823974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,2,balanced,2.1340160369873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,2,balanced,3.5264854431152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,2,balanced,2.142869313557943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,2,balanced,3.5367253621419272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,2,balanced,2.1563733418782554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,2,balanced,2.169343948364258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,2,balanced,3.6625067392985025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,2,balanced,2.18777068456014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,2,balanced,3.671722730000814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,2,balanced,3.4520479838053384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,2,balanced,3.703808148701986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,2,balanced,3.553621292114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,2,balanced,4.056576093037923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,2,balanced,3.603626569112142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,2,balanced,4.061013221740723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,2,balanced,4.962645212809245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,2,balanced,3.7814613978068032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,2,balanced,6.153216044108073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,2,balanced,6.407850901285808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,2,balanced,8.206677118937174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,2,balanced,6.506837209065755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,2,balanced,6.2706349690755205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,2,balanced,9.901738484700521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,2,balanced,9.042432149251303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,2,balanced,12.22109349568685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,2,balanced,11.220128377278646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,2,balanced,14.775296529134115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,2,balanced,15.615999857584635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,8,balanced,0.9852586587270101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,8,balanced,0.8987306753794352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,8,balanced,0.8982079823811849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,8,balanced,0.9108479817708334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,8,balanced,0.9035092989603678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,8,balanced,0.9053866863250732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,8,balanced,0.908799966176351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,8,balanced,0.9130667050679525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,8,balanced,0.9321813583374023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,2,balanced,18.53421910603841
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,8,balanced,0.935424009958903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,8,balanced,0.9407146771748861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,8,balanced,0.948906660079956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,8,balanced,0.9548799991607666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,8,balanced,0.9688746929168701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,8,balanced,1.559893290201823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,2,balanced,20.092928568522137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,8,balanced,1.5919787089029949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,8,balanced,1.6279892921447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,8,balanced,2.273109277089437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,8,balanced,2.899968147277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,8,balanced,4.348245302836101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,2,balanced,22.922922770182293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,8,balanced,5.70146115620931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,2,balanced,24.87091318766276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,8,balanced,8.309418360392252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,8,balanced,10.709674835205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,2,balanced,29.539499918619793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,2,balanced,30.29589335123698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,8,balanced,15.186602274576822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,2,power_law_1.01,0.8370176315307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,2,power_law_1.01,1.427455997467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,2,power_law_1.01,1.8962432861328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,8,balanced,18.61410140991211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,2,power_law_1.01,3.00134391784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,2,balanced,36.41393025716146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,2,power_law_1.01,3.955302429199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,2,balanced,36.367530822753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,2,power_law_1.01,6.279167938232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,8,balanced,23.58306121826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,2,power_law_1.01,6.547865295410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,2,power_law_1.01,6.7934211730957035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,2,power_law_1.01,6.8693695068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,8,balanced,26.890240987141926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,2,balanced,43.57939147949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,2,power_law_1.01,7.044915008544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,2,power_law_1.01,7.07031021118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,2,power_law_1.01,7.2052734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,2,power_law_1.01,7.388774108886719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,2,power_law_1.01,7.693312072753907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,2,power_law_1.01,7.814348602294922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,2,balanced,55.526570638020836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,2,power_law_1.01,8.001741027832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,2,power_law_1.01,8.0932861328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,2,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,2,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,2,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,2,balanced,0.06809600194295247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,2,balanced,0.2874026695887248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,2,power_law_1.01,8.560639953613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,2,balanced,0.5370879968007406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,2,balanced,0.7831892967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,2,balanced,0.7881386280059814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,2,balanced,0.7954773108164469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,2,balanced,0.7987199624379476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,2,balanced,0.8091306686401367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,2,balanced,0.822271982828776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,2,balanced,0.8325119813283285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,2,balanced,0.851967970530192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,2,balanced,0.8715946674346924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,2,balanced,0.8900266488393148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,2,power_law_1.01,8.77096939086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,2,balanced,0.9330346584320068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,2,balanced,1.0183680057525635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,2,balanced,1.1002720197041829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,2,balanced,1.2649813493092854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,2,balanced,1.4716533025105794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,2,balanced,1.8696533838907878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,2,power_law_1.01,9.241395568847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,2,balanced,2.2249813079833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,2,balanced,67.92447916666667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,2,balanced,3.00492795308431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,2,balanced,3.84665584564209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,2,power_law_1.01,10.203545379638673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,2,balanced,5.599231719970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,2,balanced,7.302997589111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,2,power_law_1.01,11.904204559326171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,2,power_law_1.01,12.916326904296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,1,balanced,0.03497066597143809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,1,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,1,balanced,0.2373973329861959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,1,balanced,0.4556800127029419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,1,balanced,0.8736373583475748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,1,balanced,0.8813227017720541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,1,balanced,0.8867839972178141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,1,balanced,0.8913919925689697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,1,balanced,0.8961706956227621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,1,balanced,0.9018026987711588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,1,balanced,0.9098239739735922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,1,balanced,0.920746644337972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,1,balanced,0.9284266630808512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,1,balanced,0.943615992863973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,1,balanced,0.9594826698303223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,1,balanced,0.9751573403676351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,1,balanced,1.005738655726115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,1,balanced,1.070250670115153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,1,balanced,1.1366399923960369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,1,balanced,1.245695988337199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,2,power_law_1.01,16.36003875732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,1,balanced,1.376922607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,1,balanced,1.6511999766031902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,1,balanced,1.9297280311584473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,1,balanced,2.4654506047566733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,1,balanced,3.0646613438924155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,1,balanced,4.367189407348633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,1,balanced,5.651109059651692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,2,power_law_1.01,19.043942260742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,2,power_law_1.01,25.57091827392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,2,power_law_1.01,32.369049072265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,2,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,2,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,2,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,2,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,2,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,2,power_law_1.2,0.20828158855438234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,2,power_law_1.2,0.232857608795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,2,power_law_1.2,0.23265280723571777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,2,power_law_1.2,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,2,power_law_1.2,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,2,power_law_1.2,0.23428480625152587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,2,power_law_1.2,0.24391679763793944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,2,power_law_1.2,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,2,power_law_1.2,0.2568192005157471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,2,power_law_1.2,0.2613248109817505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,2,power_law_1.2,0.26439681053161623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,2,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,2,power_law_1.2,0.31395199298858645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,2,power_law_1.2,0.315391993522644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,2,power_law_1.2,0.36188158988952634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,2,power_law_1.2,0.42495999336242674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,2,power_law_1.2,0.5339136123657227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,2,power_law_1.2,0.6928383827209472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,2,power_law_1.2,0.9981951713562012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,2,power_law_1.2,1.4516223907470702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,2,power_law_1.2,2.100223922729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,2,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,2,power_law_1.01,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,2,power_law_1.01,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,2,power_law_1.01,0.6799359798431397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,2,power_law_1.01,0.8861696243286132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,2,power_law_1.01,1.0764287948608398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,2,power_law_1.01,1.5589376449584962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,2,power_law_1.01,1.5941632270812989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,2,power_law_1.01,1.6928768157958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,4,power_law_1.2,0.3251967906951904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,4,power_law_1.2,0.5453824043273926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,2,power_law_1.01,1.745305633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,4,power_law_1.2,0.7972864151000977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,2,power_law_1.01,1.7960960388183593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,4,power_law_1.2,1.0792960166931151
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,2,power_law_1.01,1.826406478881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,2,power_law_1.2,2.5669631958007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,4,power_law_1.2,1.3494272232055664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,2,power_law_1.01,1.8122751235961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,4,power_law_1.2,1.8208768844604493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,2,power_law_1.01,1.8438144683837892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,2,power_law_1.01,1.9273727416992188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,4,power_law_1.2,2.0678592681884767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,2,power_law_1.01,1.9531776428222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,4,power_law_1.2,2.376908874511719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,2,power_law_1.01,2.031820869445801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,2,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,2,power_law_1.01,2.1423999786376955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,4,power_law_1.2,2.5071359634399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,2,power_law_1.01,2.2681600570678713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,4,power_law_1.2,2.371993637084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,2,balanced,0.1469439963499705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,2,balanced,0.34867199261983234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,2,power_law_1.01,2.510438346862793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,2,balanced,0.6686720053354899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,4,power_law_1.2,2.7246591567993166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,2,balanced,1.3001386324564617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,2,power_law_1.01,2.7481855392456054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,2,balanced,2.5581226348876953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,4,power_law_1.2,2.4920064926147463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,2,balanced,2.5632425944010415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,2,balanced,2.572970708211263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,2,power_law_1.01,3.2034687042236327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,4,power_law_1.2,2.290278434753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,2,balanced,2.575530687967936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,4,power_law_1.2,2.6611711502075197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,2,balanced,2.5820159912109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,2,power_law_1.01,3.8035327911376955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,2,balanced,2.590538660685221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,4,power_law_1.2,2.532352066040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,2,balanced,2.6050559679667153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,2,balanced,2.612053394317627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,2,power_law_1.01,4.8097278594970705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,4,power_law_1.2,2.7998207092285154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,2,balanced,2.630314668019613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,2,balanced,2.650965372721354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,4,power_law_1.2,2.7645952224731447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,2,balanced,2.6697333653767905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,2,power_law_1.01,5.904383850097656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,4,power_law_1.2,2.892185592651367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,2,balanced,2.7083094914754233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,2,balanced,2.851327896118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,4,power_law_1.2,3.000524711608887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,2,balanced,2.9213012059529624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,2,balanced,2.9224958419799805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,4,power_law_1.2,3.266764831542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,2,power_law_1.01,7.9431617736816404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,2,balanced,3.073024113972982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,4,power_law_1.2,3.3851390838623048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,2,balanced,3.2819201151529946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,4,power_law_1.2,3.8428672790527343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,2,balanced,3.520000139872233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,2,power_law_1.01,9.848422241210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,4,power_law_1.2,4.439033508300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,2,balanced,4.023807843526204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,4,power_law_1.2,5.532467269897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,2,balanced,4.5090131759643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,2,balanced,5.822293599446614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,4,power_law_1.2,6.462464141845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,2,balanced,7.406250635782878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,4,power_law_1.2,8.245862579345703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,4,power_law_1.2,10.260684967041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,8,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,8,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,8,power_law_1.01,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,8,power_law_1.01,0.25579519271850587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,8,power_law_1.01,0.314572811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,8,power_law_1.01,0.3532799959182739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,8,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,8,power_law_1.01,0.35717120170593264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,8,power_law_1.01,0.3487744092941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,8,power_law_1.01,0.3231744050979614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,8,power_law_1.01,0.35000319480895997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,8,power_law_1.01,0.34344959259033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,8,power_law_1.01,0.3575808048248291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,64,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,8,power_law_1.01,0.3637248039245605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,64,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,64,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,8,power_law_1.01,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,64,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,8,power_law_1.01,0.3870719909667969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,64,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,8,power_law_1.01,0.41286401748657225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,64,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,8,power_law_1.01,0.45240321159362795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,64,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,8,power_law_1.01,0.48578557968139646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,64,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,64,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,64,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,64,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,64,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,8,power_law_1.01,0.5525504112243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,64,balanced,0.060415998101234436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,64,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,64,balanced,0.053930665055910744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,64,balanced,0.05409066875775655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,64,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,64,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,64,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,64,balanced,0.054773335655530296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,8,power_law_1.01,0.6221824169158936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,64,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,64,balanced,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,64,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,64,balanced,0.061610668897628784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,64,balanced,0.06400000055631001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,64,balanced,0.07202133536338806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,64,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,64,balanced,0.09113599856694539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,64,balanced,0.09026666482289632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,64,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,64,balanced,0.19694934288660684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,64,balanced,0.20718934138615927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,64,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,64,balanced,0.2599253257115682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,64,power_law_1.2,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,64,balanced,0.29713066418965656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,64,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,64,power_law_1.2,0.07516160011291503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,64,balanced,0.37939198811848956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,8,power_law_1.01,0.851353645324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,64,power_law_1.2,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,64,balanced,0.42769066492716473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,64,power_law_1.2,0.117958402633667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,8,power_law_1.01,1.0770432472229003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,64,balanced,0.5283840099970499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,64,power_law_1.2,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,64,power_law_1.2,0.31334400177001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,64,balanced,0.632149338722229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,8,power_law_1.01,1.549721622467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,64,power_law_1.2,0.4642816066741943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,64,balanced,0.9303039709726969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,64,power_law_1.2,0.6207488059997559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,8,power_law_1.01,1.9335168838500976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,64,balanced,1.2263946533203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,64,power_law_1.2,0.9259008407592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,8,power_law_1.01,2.8841983795166017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,64,power_law_1.2,1.3017087936401368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,64,power_law_1.2,2.3265216827392576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,8,power_law_1.01,3.747020721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,64,power_law_1.2,3.1883264541625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,4,2,balanced,0.2667520046234131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,4,2,balanced,0.46865065892537433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,4,2,balanced,0.9040213425954183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,4,2,balanced,0.9065813223520914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,4,2,balanced,0.9065813223520914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,4,2,balanced,0.9108479817708334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,4,2,balanced,0.9151146411895752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,4,2,balanced,0.9185280005137125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,4,2,balanced,0.9390079975128174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,4,2,balanced,0.9417386849721273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,4,2,balanced,0.9517813523610433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,4,2,balanced,0.959658702214559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,4,2,balanced,0.965119997660319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,4,2,balanced,0.9883306821187338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,4,2,balanced,1.1182080109914143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,4,2,balanced,1.157429297765096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,4,2,balanced,1.2178773085276287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,4,2,balanced,1.576789379119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,4,2,balanced,1.849514643351237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,4,2,balanced,2.1087573369344077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,4,2,balanced,2.4144213994344077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,4,2,balanced,3.260586738586426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,4,2,balanced,4.049749374389648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,4,2,balanced,5.702314376831055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,4,2,balanced,7.225002924601237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,4,2,balanced,9.954645156860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,4,2,balanced,13.013844807942709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,16,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,16,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,16,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,16,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,16,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,16,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,16,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,16,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,16,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,16,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,16,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,16,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,16,power_law_1.2,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,16,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,16,power_law_1.2,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,16,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,16,power_law_1.2,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,16,power_law_1.2,0.10076160430908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,16,power_law_1.2,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,16,power_law_1.2,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,16,power_law_1.2,0.4237311840057373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,16,power_law_1.2,0.6430528163909912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,4,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,4,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,4,balanced,0.28074665864308673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,4,balanced,0.5430399974187216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,4,balanced,1.0397013028462727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,4,balanced,2.029226620992025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,4,balanced,3.0149974822998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,4,balanced,3.0197760264078775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,4,balanced,3.0293334325154624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,128,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,4,balanced,3.034111976623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,128,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,4,balanced,3.0431572596232095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,128,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,128,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,4,balanced,3.0516907374064126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,128,power_law_1.2,0.036627200245857236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,128,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,4,balanced,3.0605653127034507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,128,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,128,power_law_1.2,0.0389055997133255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,4,balanced,3.086336135864258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,128,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,128,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,4,balanced,3.10971736907959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,128,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,128,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,4,balanced,3.129514694213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,128,power_law_1.2,0.04545280039310455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,128,power_law_1.2,0.047065600752830505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,128,power_law_1.2,0.05118719935417175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,4,balanced,3.1556266148885093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,128,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,2,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,128,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,2,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,128,power_law_1.2,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,2,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,4,balanced,3.2312053044637046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,2,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,128,power_law_1.2,0.10279680490493774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,2,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,2,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,128,power_law_1.2,0.13803520202636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,2,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,4,balanced,3.3744214375813804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,2,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,128,power_law_1.2,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,2,power_law_1.01,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,2,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,128,power_law_1.2,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,2,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,4,balanced,3.507370630900065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,2,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,128,power_law_1.2,0.3905535936355591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,2,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,128,power_law_1.2,0.6193151950836182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,2,power_law_1.01,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,4,balanced,3.6469761530558267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,128,power_law_1.2,0.7383039951324463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,2,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,2,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,16,power_law_1.2,0.9195520401000976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,4,balanced,3.935231844584147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,128,power_law_1.2,1.3094911575317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,2,power_law_1.01,0.08253440260887146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,2,power_law_1.01,0.10301439762115479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,128,power_law_1.2,1.801215934753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,4,balanced,4.301125208536784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,2,power_law_1.01,0.13332480192184448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,4,balanced,4.7537492116292315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,4,balanced,5.238272031148274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,2,power_law_1.01,0.19516160488128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,4,balanced,6.533461252848308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,4,balanced,8.02508799235026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,2,power_law_1.01,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,2,power_law_1.01,0.38154239654541017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,2,power_law_1.01,0.5257215976715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,64,power_law_1.01,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,64,power_law_1.01,0.21707520484924317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,64,power_law_1.01,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,64,power_law_1.01,0.21647360324859619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,64,power_law_1.01,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,64,power_law_1.01,0.132096004486084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,64,power_law_1.01,0.16199040412902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,64,power_law_1.01,0.2199552059173584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,64,power_law_1.01,0.17408000230789183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,64,power_law_1.01,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,64,power_law_1.01,0.18655999898910522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,64,power_law_1.01,0.19742720127105712
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,64,power_law_1.01,0.2174976110458374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,64,power_law_1.01,0.21667840480804443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,64,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,64,power_law_1.01,0.20643839836120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,64,power_law_1.01,0.21094400882720948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,64,power_law_1.01,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,64,power_law_1.01,0.27238399982452394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,8,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,64,power_law_1.01,0.3078144073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,16,power_law_1.2,1.4266367912292481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,8,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,64,power_law_1.01,0.34897921085357664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,8,power_law_1.01,0.1052672028541565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,8,power_law_1.01,0.18391040563583375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,64,power_law_1.01,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,8,power_law_1.01,0.15749119520187377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,8,power_law_1.01,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,64,power_law_1.01,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,8,power_law_1.01,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,8,power_law_1.01,0.22650880813598634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,8,power_law_1.01,0.23736319541931153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,64,power_law_1.01,0.910540771484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,8,power_law_1.01,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,8,power_law_1.01,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,8,power_law_1.01,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,64,power_law_1.01,1.1692031860351562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,8,power_law_1.01,0.26255359649658205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,8,power_law_1.01,0.2559999942779541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,8,power_law_1.01,0.2758656024932861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,64,power_law_1.01,1.6408575057983399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,8,power_law_1.01,0.2789376020431519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,8,power_law_1.01,0.288755202293396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,8,power_law_1.01,0.3201024055480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,8,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,8,power_law_1.01,0.3221503973007202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,8,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,64,power_law_1.01,2.510233688354492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,8,power_law_1.01,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,8,power_law_1.01,0.3670016050338745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,8,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,8,power_law_1.01,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,8,power_law_1.01,0.11117440462112427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,8,power_law_1.01,0.5574656009674073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,8,power_law_1.01,0.6610943794250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,8,power_law_1.01,0.19456000328063966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,8,power_law_1.01,0.1474560022354126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,8,power_law_1.01,1.1182080268859864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,8,power_law_1.01,0.17182719707489014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,8,power_law_1.01,1.3412351608276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,8,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,8,power_law_1.01,0.17100800275802613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,8,power_law_1.01,0.1691648006439209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,8,power_law_1.01,2.025062370300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,8,power_law_1.01,0.1751039981842041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,8,power_law_1.01,0.22527999877929689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,8,power_law_1.01,3.0496768951416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,8,power_law_1.01,0.20887680053710939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,8,power_law_1.01,0.23224320411682128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,8,power_law_1.01,0.2451456069946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,8,power_law_1.01,0.26540799140930177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,8,power_law_1.01,0.314572811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,8,power_law_1.01,0.34242560863494875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,8,power_law_1.01,0.39485440254211424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,8,power_law_1.01,0.4603903770446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,8,power_law_1.01,0.6117311954498291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,8,power_law_1.01,0.7567359924316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,2,power_law_1.01,0.8808447837829589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,8,power_law_1.01,1.262387180328369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,8,power_law_1.01,1.7299455642700194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,8,power_law_1.01,2.51146240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,8,power_law_1.01,3.337625503540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,16,power_law_1.2,2.248294448852539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,2,power_law_1.01,1.202175998687744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,2,power_law_1.01,1.7520639419555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,32,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,32,power_law_1.01,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,32,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,32,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,32,power_law_1.01,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,32,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,32,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,32,power_law_1.01,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,32,power_law_1.01,0.024134400486946105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,32,power_law_1.01,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,32,power_law_1.01,0.024563199281692503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,32,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,32,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,32,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,32,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,32,power_law_1.01,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,32,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,32,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,32,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,32,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,32,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,32,power_law_1.01,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,32,power_law_1.01,0.10649600028991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,32,power_law_1.01,0.20049920082092285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,32,power_law_1.01,0.27504639625549315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,32,power_law_1.01,0.4200448036193848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,32,power_law_1.01,0.6383552074432373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,2,power_law_1.01,2.814361572265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,8,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,8,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,8,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,8,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,8,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,8,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,8,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,8,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,8,balanced,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,8,balanced,0.045221333702405296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,8,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,8,balanced,0.04724800089995066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,8,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,32,balanced,0.06654400130112965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,32,balanced,0.06690133114655812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,8,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,32,balanced,0.0653546651204427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,8,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,32,balanced,0.2851840058962504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,8,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,8,balanced,0.062122667829195656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,32,balanced,0.5422079960505167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,8,balanced,0.07048533360163371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,8,balanced,0.08055466910203297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,32,balanced,1.0451626777648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,8,balanced,0.09250133236249287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,8,balanced,0.1616213321685791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,32,balanced,1.5412640571594238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,8,balanced,0.2525706688563029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,32,balanced,1.5441919962565105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,8,balanced,0.3712000052134196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,32,balanced,1.5443305969238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,8,balanced,0.500053326288859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,32,balanced,1.5453866322835286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,8,balanced,0.8268799781799316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,32,balanced,1.5494826634724934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,32,balanced,1.5540852546691895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,8,balanced,1.2021599610646565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,32,balanced,1.5556267102559407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,32,balanced,1.562453269958496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,32,balanced,1.5703040758768718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,32,balanced,1.5749120712280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,32,balanced,1.5887360572814941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,32,balanced,1.6223252614339192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,32,balanced,1.66758394241333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,32,balanced,1.70904541015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,32,balanced,1.9462560017903645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,32,balanced,2.0101119677225747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,32,balanced,2.198186715443929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,32,balanced,2.2186667124430337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,32,balanced,2.6852585474650064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,32,balanced,3.2413012186686196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,32,balanced,4.137642542521159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,2,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,2,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,2,balanced,0.18705066045125326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,2,balanced,0.3802453279495239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,2,balanced,0.6937599976857504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,2,balanced,0.9419093132019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,2,balanced,0.9454933007558187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,2,balanced,0.9487253030141195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,2,balanced,0.9530026912689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,2,balanced,0.9560746351877848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,2,balanced,0.9620479742685953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,2,balanced,0.9678506851196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,2,balanced,0.9738240242004395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,2,balanced,0.9837226867675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,2,balanced,0.9936160246531168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,2,balanced,1.0038613478342693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,2,balanced,1.0199039777119954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,2,balanced,1.0562506516774495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,2,balanced,1.0926079750061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,2,balanced,1.1490986347198486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,2,balanced,1.222826639811198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,2,balanced,1.3624320030212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,2,balanced,1.5182506243387859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,2,balanced,1.849514643351237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,2,balanced,2.1775360107421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,2,balanced,2.9725014368693032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,4,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,4,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,4,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,4,balanced,0.029680001238981884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,4,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,4,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,4,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,4,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,4,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,4,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,4,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,2,balanced,3.9086081186930337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,4,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,4,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,4,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,4,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,4,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,4,balanced,0.09318400422732036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,4,balanced,0.08345599969228108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,4,balanced,0.14284800489743552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,4,balanced,0.16008533040682474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,4,balanced,0.24064000447591147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,4,balanced,0.33177600304285687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,4,balanced,0.4935679833094279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,4,balanced,0.7127040227254232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,4,balanced,1.0839040279388428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,4,balanced,1.45305601755778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,1,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,1,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,1,balanced,0.24081067244211832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,1,balanced,0.45497600237528485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,1,balanced,0.8702293237050375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,1,balanced,0.8779093424479166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,1,balanced,0.8845653533935547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,1,balanced,0.8903679847717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,1,balanced,0.8971947034200033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,1,balanced,0.9050453503926595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,1,balanced,0.9168213208516439
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,1,balanced,0.9314986864725748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,1,balanced,0.9662933349609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,1,balanced,0.965119997660319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,1,balanced,0.989525318145752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,1,balanced,1.0151253541310628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,1,balanced,1.0699093341827393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,1,balanced,1.1612160205841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,1,balanced,1.257813294728597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,1,balanced,1.4230186144510906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,1,balanced,1.6578559875488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,1,balanced,2.080597400665283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,1,balanced,2.4765440622965493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,1,balanced,3.2918081283569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,1,balanced,4.205050786336263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,1,balanced,6.121642430623372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,1,balanced,8.177322387695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,16,power_law_1.01,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,16,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,16,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,16,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,16,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,16,power_law_1.01,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,16,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,16,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,16,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,16,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,16,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,16,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,16,power_law_1.01,0.19251199960708618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,16,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,16,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,16,power_law_1.01,0.1474560022354126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,16,power_law_1.01,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,16,power_law_1.01,0.14766080379486085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,16,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,16,power_law_1.01,0.19517439603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,16,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,16,power_law_1.01,0.1159168004989624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,16,power_law_1.01,0.130457603931427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,16,power_law_1.01,0.0989184021949768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,16,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,16,power_law_1.01,0.09728000164031983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,16,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,16,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,16,power_law_1.01,0.1482751965522766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,16,power_law_1.01,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,16,power_law_1.01,0.15564800500869752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,16,power_law_1.01,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,16,power_law_1.01,0.12387839555740357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,16,power_law_1.01,0.16609280109405516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,16,power_law_1.01,0.1392639994621277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,16,power_law_1.01,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,16,power_law_1.01,0.1939136028289795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,16,power_law_1.01,0.3733504056930542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,16,power_law_1.01,0.18882559537887572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,16,power_law_1.01,0.4855807781219482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,16,power_law_1.01,0.20762240886688232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,16,power_law_1.01,0.21340160369873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,16,power_law_1.01,0.7204864025115967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,16,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,16,power_law_1.01,0.26071040630340575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,16,power_law_1.01,1.021331214904785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,16,power_law_1.01,0.2988032102584839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,16,power_law_1.01,0.365337610244751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,16,power_law_1.01,0.4216447830200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,16,power_law_1.01,0.5576704025268555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,16,power_law_1.01,0.7249919891357421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,16,power_law_1.01,1.1085503578186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,16,power_law_1.01,1.5159040451049806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,64,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,64,power_law_1.2,0.02988159954547882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,64,power_law_1.2,0.02988159954547882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,64,power_law_1.2,0.029676800966262816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,64,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,64,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,64,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,64,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,64,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,64,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,64,power_law_1.2,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,64,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,64,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,64,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,64,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,64,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,64,power_law_1.2,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,64,power_law_1.2,0.11325440406799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,64,power_law_1.2,0.12492799758911133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,64,power_law_1.2,0.18780159950256348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,64,power_law_1.2,0.24965119361877441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,64,power_law_1.2,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,64,power_law_1.2,0.6094848155975342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,64,power_law_1.2,1.0158080101013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,64,power_law_1.2,1.3619199752807618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,64,power_law_1.2,2.2142976760864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,8,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,8,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,8,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,8,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,8,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,8,balanced,0.04795733094215393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,8,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,8,balanced,0.0499893327554067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,8,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,8,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,8,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,8,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,8,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,8,balanced,0.058880001306533813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,8,balanced,0.0602453351020813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,8,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,8,balanced,0.08703999718030293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,8,balanced,0.16759467124938965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,8,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,8,balanced,0.2874026695887248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,8,balanced,0.3821226755777995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,8,balanced,0.4790560007095337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,8,balanced,0.7698773543039957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,8,balanced,1.0545492966969807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,8,balanced,1.7051307360331218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,8,balanced,2.3243093490600586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,2,balanced,0.222378671169281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,2,balanced,0.44407467047373456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,2,balanced,0.764415979385376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,2,balanced,1.467733383178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,2,balanced,2.8419411977132163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,2,balanced,4.041386604309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,2,balanced,4.060986518859863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,2,balanced,4.079445203145345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,2,balanced,4.096853256225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,2,balanced,4.112895965576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,2,balanced,4.142570813496907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,64,power_law_1.2,2.6603519439697267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,2,balanced,4.1731414794921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,2,balanced,4.1980587641398115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,2,balanced,4.254549344380696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,2,balanced,4.292240142822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,2,balanced,4.333056131998698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,2,balanced,4.418560028076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,2,balanced,4.602853457132976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,2,balanced,4.760234514872233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,2,balanced,5.177002588907878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,2,balanced,5.363871892293294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,2,balanced,5.93612798055013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,2,balanced,6.514858881632487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,2,balanced,7.716864267985026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,2,balanced,9.41209602355957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,2,balanced,13.27068837483724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,2,balanced,16.863914489746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,64,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,64,power_law_1.2,0.07761279940605163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,64,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,64,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,64,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,64,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,64,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,64,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,64,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,64,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,64,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,64,power_law_1.2,0.044633600115776065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,64,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,64,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,64,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,64,power_law_1.2,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,64,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,64,power_law_1.2,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,64,power_law_1.2,0.0948095977306366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,64,power_law_1.2,0.14008320569992067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,64,power_law_1.2,0.22650880813598634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,64,power_law_1.2,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,64,power_law_1.2,0.41164798736572267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,64,power_law_1.2,0.5527552127838135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,64,power_law_1.2,0.7739391803741456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,64,power_law_1.2,1.286348819732666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,64,power_law_1.2,1.8868032455444337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,8,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,8,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,8,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,8,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,8,balanced,0.18875734011332193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,8,balanced,0.19012266397476196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,8,balanced,0.1904639999071757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,8,balanced,0.19113600254058838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,8,balanced,0.1914880077044169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,8,balanced,0.19368533293406168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,8,balanced,0.19575466712315878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,8,balanced,0.1962666710217794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,8,balanced,0.19933867454528809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,8,balanced,0.20273067553838095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,8,balanced,0.2053119937578837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,8,balanced,0.20905599991480509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,8,balanced,0.22169599930445352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,8,balanced,0.23227733373641968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,8,balanced,0.24439465999603271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,8,balanced,0.27153066794077557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,8,balanced,0.3041279911994934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,8,balanced,0.35309334595998126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,8,balanced,0.474453330039978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,8,balanced,0.6292479832967123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,8,balanced,1.008128007253011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,8,balanced,1.3540693918863933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,32,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,32,balanced,0.24661332368850708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,32,balanced,0.36505599816640216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,32,balanced,0.7430826822916666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,32,balanced,1.0775893529256184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,32,balanced,1.0683733622233074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,32,balanced,1.072981357574463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,32,balanced,1.0586453278859456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,32,balanced,1.0600106716156006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,32,balanced,1.0639359951019287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,32,balanced,1.0653013388315837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,32,balanced,1.071786642074585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,32,balanced,1.074346701304118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,32,balanced,1.079973300298055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,32,balanced,1.0876586437225342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,32,balanced,1.0936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,32,balanced,1.107968012491862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,32,balanced,1.1187199751536052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,32,balanced,1.141760031382243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,32,balanced,1.1627519925435383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,32,balanced,1.2052480379740398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,32,balanced,1.3165226777394612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,32,balanced,1.3800106048583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,32,balanced,1.6974506378173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,32,balanced,1.8882560729980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,32,balanced,2.5214293797810874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,32,balanced,3.1059627532958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,1,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,1,power_law_1.2,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,1,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,1,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,1,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,1,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,1,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,1,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,1,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,1,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,1,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,1,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,1,power_law_1.2,0.07086079716682434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,1,power_law_1.2,0.07720959782600403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,1,power_law_1.2,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,1,power_law_1.2,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,1,power_law_1.2,0.16117759943008422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,1,power_law_1.2,0.20848639011383058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,1,power_law_1.2,0.25231359004974363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,1,power_law_1.2,0.32378880977630614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,1,power_law_1.2,0.3985408067703247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,1,power_law_1.2,0.5519360065460205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,8,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,8,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,8,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,8,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,8,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,8,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,8,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,8,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,8,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,8,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,8,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,8,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,8,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,8,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,8,balanced,0.036517334481080375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,8,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,8,balanced,0.04692799846331278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,8,balanced,0.0679253339767456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,8,balanced,0.07133866846561432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,8,balanced,0.10171733299891154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,8,balanced,0.19029333194096884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,8,balanced,0.3275093237559001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,8,balanced,0.43434667587280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,8,balanced,0.6577386856079102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,8,balanced,0.9026559988657633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,1,power_law_1.2,0.7376895904541015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,1,power_law_1.2,1.1503616333007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,1,power_law_1.2,1.5890432357788087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,128,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,128,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,128,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,128,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,128,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,128,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,128,power_law_1.01,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,128,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,128,power_law_1.01,0.04196479916572571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,128,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,128,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,128,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,128,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,128,power_law_1.01,0.053420799970626834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,128,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,128,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,128,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,128,power_law_1.01,0.10094079971313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,128,power_law_1.01,0.11735039949417114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,128,power_law_1.01,0.16138240098953247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,128,power_law_1.01,0.21381120681762694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,128,power_law_1.01,0.31559679508209226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,128,power_law_1.01,0.35532801151275634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,128,power_law_1.01,0.5234687805175782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,128,power_law_1.01,0.6893184185028076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,128,power_law_1.01,1.1278335571289062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,128,power_law_1.01,1.8302976608276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,1,power_law_1.2,2.5008127212524416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,32,power_law_1.2,0.22302720546722413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,32,power_law_1.2,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,32,power_law_1.2,0.20357120037078857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,32,power_law_1.2,0.11407359838485717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,32,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,32,power_law_1.2,0.12226560115814208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,32,power_law_1.2,0.15421439409255983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,32,power_law_1.2,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,32,power_law_1.2,0.18903039693832396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,32,power_law_1.2,0.18472959995269775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,32,power_law_1.2,0.2185215950012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,32,power_law_1.2,0.15831040143966674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,32,power_law_1.2,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,32,power_law_1.2,0.22917120456695556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,32,power_law_1.2,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,32,power_law_1.2,0.2318336009979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,32,power_law_1.2,0.26316161155700685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,32,power_law_1.2,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,32,power_law_1.2,0.33361918926239015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,32,power_law_1.2,0.38973441123962405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,32,power_law_1.2,0.47759361267089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,32,power_law_1.2,0.7038976192474365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,32,power_law_1.2,0.8804351806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,32,power_law_1.2,1.3355008125305177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,32,power_law_1.2,1.9433408737182618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,32,power_law_1.2,2.9663232803344726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,32,power_law_1.2,4.344627380371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,64,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,64,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,64,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,64,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,64,power_law_1.01,0.027212798595428467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,64,power_law_1.01,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,64,power_law_1.01,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,64,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,64,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,64,power_law_1.01,0.030073601007461547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,64,power_law_1.01,0.030694401264190672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,64,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,64,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,64,power_law_1.01,0.038700801134109494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,64,power_law_1.01,0.04523519873619079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,64,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,64,power_law_1.01,0.08130559921264649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,64,power_law_1.01,0.0851967990398407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,64,power_law_1.01,0.1363968014717102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,64,power_law_1.01,0.16015360355377198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,64,power_law_1.01,0.2246335983276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,64,power_law_1.01,0.3436543941497803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,64,power_law_1.01,0.5687295913696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,64,power_law_1.01,0.7763711929321289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,1,power_law_1.2,3.383091354370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,8,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,8,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,8,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,8,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,8,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,8,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,8,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,8,power_law_1.2,0.07331839799880982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,8,power_law_1.2,0.08417279720306396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,8,power_law_1.2,0.09687039852142335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,8,power_law_1.2,0.13043839931488038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,8,power_law_1.2,0.14315520524978637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,8,power_law_1.2,0.18534400463104247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,8,power_law_1.2,0.2170880079269409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,8,power_law_1.2,0.26705920696258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,8,power_law_1.2,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,8,power_law_1.2,0.43274240493774413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,8,power_law_1.2,0.5513216018676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,8,power_law_1.2,0.7833600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,16,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,16,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,16,power_law_1.01,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,16,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,16,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,16,power_law_1.01,0.05364480018615723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,8,power_law_1.2,1.024409580230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,16,power_law_1.01,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,16,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,16,power_law_1.01,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,16,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,16,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,16,power_law_1.01,0.05711359977722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,16,power_law_1.01,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,16,power_law_1.01,0.07655680179595947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,16,power_law_1.01,0.08581119775772095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,16,power_law_1.01,0.12267520427703857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,16,power_law_1.01,0.17571840286254883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,16,power_law_1.01,0.20643839836120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,16,power_law_1.01,0.25333759784698484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,16,power_law_1.01,0.2965503931045532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,16,power_law_1.01,0.3446399927139282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,16,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,16,power_law_1.01,0.6166528224945068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,16,power_law_1.01,0.9316224098205567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,16,power_law_1.01,1.348198413848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,16,power_law_1.01,2.1391359329223634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,16,power_law_1.01,2.8225536346435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,8,power_law_1.2,1.5310784339904786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.5400576114654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,1,power_law_1.01,1.0385408401489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,8,power_law_1.2,1.9206144332885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,1,power_law_1.01,1.5259648323059083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,1,power_law_1.01,2.0975616455078123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,1,power_law_1.01,2.9448192596435545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,1,power_law_1.01,3.1107072830200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,1,power_law_1.01,3.184435272216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,1,power_law_1.01,3.2841728210449217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,1,power_law_1.01,3.418521499633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,1,power_law_1.01,3.5276798248291015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,1,power_law_1.01,3.541196823120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,1,power_law_1.01,3.739033508300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,8,power_law_1.2,2.7418495178222657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,1,power_law_1.01,3.842457580566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,1,power_law_1.01,3.9600128173828124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,1,power_law_1.01,4.180992126464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,1,power_law_1.01,4.443135833740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,1,power_law_1.01,4.658176040649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,1,power_law_1.01,5.2930561065673825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,1,power_law_1.01,5.615820693969726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,1,power_law_1.01,6.7162109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,1,power_law_1.01,7.706829071044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,1,power_law_1.01,10.02209243774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,1,power_law_1.01,11.927347564697266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,1,power_law_1.01,16.957644653320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,8,power_law_1.2,3.7617664337158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,2,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,2,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,2,power_law_1.01,0.07249919772148132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,2,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,1,power_law_1.01,19.953459167480467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,2,power_law_1.01,0.25026559829711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,2,power_law_1.01,0.3932159900665283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,2,power_law_1.01,0.4104191780090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,2,power_law_1.01,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,2,power_law_1.01,0.4395008087158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,2,power_law_1.01,0.4438015937805176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,2,power_law_1.01,0.4487167835235596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,2,power_law_1.01,0.4552703857421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,2,power_law_1.01,0.48066558837890627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,2,power_law_1.01,0.48435201644897463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,2,power_law_1.01,0.49745922088623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,2,power_law_1.01,0.4956160068511963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,2,power_law_1.01,0.5214208126068115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,2,power_law_1.01,0.5539840221405029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,2,power_law_1.01,0.5765120029449463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,2,power_law_1.01,0.6643712043762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,2,power_law_1.01,0.7102464199066162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,2,power_law_1.01,0.8978431701660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,2,power_law_1.01,1.0215423583984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,2,power_law_1.01,1.4012415885925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,2,power_law_1.01,1.7057792663574218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,2,power_law_1.01,2.474803161621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,2,power_law_1.01,2.9784063339233398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,8,power_law_1.2,5.704281616210937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,32,power_law_1.01,1.0598400115966797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,32,power_law_1.01,1.5429632186889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,32,power_law_1.01,1.5357952117919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,32,power_law_1.01,1.5386624336242676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,32,power_law_1.01,1.5394816398620605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,32,power_law_1.01,1.317683219909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,32,power_law_1.01,1.07456636428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,32,power_law_1.01,1.2332799911499024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,32,power_law_1.01,1.4047231674194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,32,power_law_1.01,1.3514368057250976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,32,power_law_1.01,1.4553088188171386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,32,power_law_1.01,1.4174207687377929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,32,power_law_1.01,1.3811712265014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,32,power_law_1.01,1.3899776458740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,32,power_law_1.01,1.3815808296203613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,32,power_law_1.01,1.5177727699279786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,32,power_law_1.01,1.6297983169555663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,32,power_law_1.01,1.6930816650390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,32,power_law_1.01,1.761484718322754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,32,power_law_1.01,1.8837503433227538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,32,power_law_1.01,2.0264768600463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,32,power_law_1.01,2.4141759872436523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,32,power_law_1.01,2.9190143585205077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,32,power_law_1.01,3.462963104248047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,32,power_law_1.01,4.541849517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,32,power_law_1.01,6.571417236328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,32,power_law_1.01,9.742950439453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,8,power_law_1.2,7.495065307617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.3186624050140381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.5500927925109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,1,power_law_1.2,1.0389504432678223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,1,power_law_1.2,2.0367359161376952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,1,power_law_1.2,3.381043243408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,1,power_law_1.2,4.638489532470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,1,power_law_1.2,5.594521713256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,1,power_law_1.2,7.791206359863281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,1,power_law_1.2,8.19012451171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,1,power_law_1.2,8.454962921142577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,1,power_law_1.2,8.810905456542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,1,power_law_1.2,9.224601745605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,1,power_law_1.2,9.375334167480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,1,power_law_1.2,9.694003295898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,1,power_law_1.2,10.09459228515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,1,power_law_1.2,10.510336303710938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,1,power_law_1.2,10.844345855712891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,1,power_law_1.2,11.51651840209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,1,power_law_1.2,12.160614776611329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,1,power_law_1.2,13.261619567871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,2,power_law_1.2,0.5904384136199952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,2,power_law_1.2,0.8435711860656738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,2,power_law_1.2,1.4542847633361817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,1,power_law_1.2,13.737779235839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,2,power_law_1.2,2.2198272705078126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,2,power_law_1.2,2.7058176040649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,8,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,8,power_law_1.2,0.28590080738067625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,2,power_law_1.2,4.600627136230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,8,power_law_1.2,0.39485440254211424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,8,power_law_1.2,0.4851712226867676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,8,power_law_1.2,0.5525504112243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,2,power_law_1.2,4.796825790405274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,1,power_law_1.2,15.657965087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,8,power_law_1.2,0.7247871875762939
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,8,power_law_1.2,0.7895040035247802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,2,power_law_1.2,4.716134262084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,8,power_law_1.2,0.6811647891998291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,8,power_law_1.2,0.7188479900360107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,2,power_law_1.2,4.883238220214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,8,power_law_1.2,0.6756351947784424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,8,power_law_1.2,0.6928383827209472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,8,power_law_1.2,0.6309887886047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,2,power_law_1.2,4.846182250976563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,8,power_law_1.2,0.6164480209350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,1,power_law_1.2,16.842343139648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,8,power_law_1.2,0.6635519981384277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,8,power_law_1.2,0.7192575931549072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,2,power_law_1.2,4.990156936645508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,8,power_law_1.2,0.7665599822998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,8,power_law_1.2,0.7903232097625732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,8,power_law_1.2,0.8579071998596192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,2,power_law_1.2,5.23243522644043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,8,power_law_1.2,0.8869888305664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,8,power_law_1.2,1.0092543601989745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,8,power_law_1.2,1.072537612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,2,power_law_1.2,5.0609790802001955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,8,power_law_1.2,1.30764799118042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,2,power_law_1.2,5.230387115478516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,8,power_law_1.2,1.6572416305541993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,1,power_law_1.2,20.34483184814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,8,power_law_1.2,2.2327295303344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,2,power_law_1.2,5.368012619018555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,8,power_law_1.2,2.842419242858887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,2,power_law_1.2,5.398527908325195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,8,power_law_1.2,3.6106239318847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,2,power_law_1.2,5.417574310302735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,8,power_law_1.2,4.65162239074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,1,power_law_1.2,23.400857543945314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,2,power_law_1.2,5.9121662139892575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,2,power_law_1.2,6.128844833374023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,2,power_law_1.2,6.7178497314453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,2,power_law_1.2,7.451821136474609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,1,power_law_1.2,30.672076416015624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,2,power_law_1.2,9.26187515258789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,2,power_law_1.2,9.999974060058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,2,power_law_1.2,13.459046936035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,1,power_law_1.2,33.356390380859374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,2,power_law_1.2,15.783526611328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,2,power_law_1.2,22.652723693847655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,2,power_law_1.2,28.73753662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,2,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,2,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,2,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,2,balanced,0.1971199909845988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,2,balanced,0.4527786572774251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,2,balanced,0.45943466822306317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,2,balanced,0.4621653159459432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,2,balanced,0.4654080073038737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,2,balanced,0.4681386550267537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,2,balanced,0.46967466672261554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,2,balanced,0.47598934173583984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,2,balanced,0.4800853331883748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,2,balanced,0.48366932074228924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,2,balanced,0.4928853511810303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,2,balanced,0.5087573528289795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,2,balanced,0.5171200037002563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,2,balanced,0.5374293327331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,2,balanced,0.5862400134404501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,2,balanced,0.6244693199793497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,2,balanced,0.7307946681976318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,2,balanced,0.8507733345031738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,2,balanced,1.1583147048950195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,2,balanced,1.4160213470458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,2,balanced,2.021887938181559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,2,balanced,2.596522649129232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,2,balanced,3.8101332982381186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,2,balanced,4.928341229756673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,4,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,4,power_law_1.01,0.1435647964477539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,4,power_law_1.01,0.2076672077178955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,4,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,4,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,4,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,4,power_law_1.01,0.43048958778381347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,4,power_law_1.01,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,4,power_law_1.01,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,4,power_law_1.01,0.4612095832824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,4,power_law_1.01,0.45649919509887693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,4,power_law_1.01,0.454041576385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,4,power_law_1.01,0.4626431941986084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,4,power_law_1.01,0.4696063995361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,4,power_law_1.01,0.46940159797668457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,4,power_law_1.01,0.4808703899383545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,4,power_law_1.01,0.4878335952758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,4,power_law_1.01,0.5398528099060058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,4,power_law_1.01,0.5496831893920898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,4,power_law_1.01,0.6074368000030518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,4,power_law_1.01,0.693452787399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,4,power_law_1.01,0.85032958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,4,power_law_1.01,1.0063872337341309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,4,power_law_1.01,1.4286848068237306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,4,power_law_1.01,1.5454208374023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,4,power_law_1.01,2.208358383178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,4,power_law_1.01,2.860851287841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,8,power_law_1.01,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,8,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,8,power_law_1.01,0.027008000016212463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,8,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,8,power_law_1.01,0.027622398734092713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,8,power_law_1.01,0.03294079899787903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,8,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,8,power_law_1.01,0.03542400002479553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,8,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,8,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,8,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,8,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,8,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,8,power_law_1.01,0.0497408002614975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,8,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,8,power_law_1.01,0.09666560292243957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,8,power_law_1.01,0.10547200441360474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,8,power_law_1.01,0.14049279689788818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,8,power_law_1.01,0.17756160497665405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,4,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,4,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,4,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,4,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,4,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,4,power_law_1.01,0.02865920066833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,4,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,4,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,4,power_law_1.01,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,4,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,8,power_law_1.01,0.2711551904678345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,4,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,4,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,4,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,4,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,4,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,4,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,4,power_law_1.01,0.04975999891757965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,4,power_law_1.01,0.06287360191345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,4,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,4,power_law_1.01,0.0839680016040802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,4,power_law_1.01,0.11201280355453491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,4,power_law_1.01,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,4,power_law_1.01,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,4,power_law_1.01,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,4,power_law_1.01,0.6064127922058106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,4,power_law_1.01,1.010688018798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,4,power_law_1.01,1.4546815872192382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,8,power_law_1.01,0.3604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,8,power_law_1.01,0.5888000011444092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,8,power_law_1.01,0.8353599548339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,64,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,64,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,64,balanced,0.024400000770886738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,64,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,64,balanced,0.024746666351954143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,64,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,64,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,64,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,64,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,64,balanced,0.02628266563018163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,64,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,64,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,64,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,64,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,64,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,64,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,64,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,64,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,64,balanced,0.04283200204372406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,64,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,64,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,64,balanced,0.14079999923706055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,64,balanced,0.23398399353027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,64,balanced,0.3408213456471761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,64,balanced,0.4773546854654948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,8,power_law_1.01,1.2707839965820313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,2,power_law_1.2,0.4448256015777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,2,power_law_1.2,0.6352896213531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,2,power_law_1.2,0.9727999687194824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,2,power_law_1.2,1.391801643371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,2,power_law_1.2,1.9150848388671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,2,power_law_1.2,3.161292839050293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,2,power_law_1.2,3.390464019775391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,2,power_law_1.2,3.562086486816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,2,power_law_1.2,3.5741695404052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,2,power_law_1.2,3.6757503509521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,2,power_law_1.2,3.7953536987304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,2,power_law_1.2,3.871744155883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,2,power_law_1.2,3.9946239471435545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,2,power_law_1.2,4.1136127471923825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,2,power_law_1.2,4.25533447265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,2,power_law_1.2,4.362854385375977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,2,power_law_1.2,4.465663909912109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,2,power_law_1.2,4.650150299072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,2,power_law_1.2,4.695859146118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,8,power_law_1.01,1.7735679626464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,2,power_law_1.2,5.310873413085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,2,power_law_1.2,5.906022262573242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,2,power_law_1.2,6.992076873779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,2,power_law_1.2,7.828684997558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,2,power_law_1.2,10.304716491699219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,64,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,64,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,64,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,64,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,64,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,64,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,64,balanced,0.030368000268936157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,64,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,64,balanced,0.031199999153614044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,64,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,64,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,64,balanced,0.034272000193595886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,64,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,64,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,64,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,64,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,64,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,2,power_law_1.2,12.826419067382812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,64,balanced,0.07850666840871175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,64,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,64,balanced,0.29524266719818115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,64,balanced,0.37748265266418457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,64,balanced,0.598527987798055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,64,balanced,0.7867733637491862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,2,power_law_1.2,16.94081268310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,2,power_law_1.2,21.23345947265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,1,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,1,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,1,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,1,power_law_1.01,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,1,power_law_1.01,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,1,power_law_1.01,0.1861631989479065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,1,power_law_1.01,0.2721791982650757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,1,power_law_1.01,0.2885632038116455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,1,power_law_1.01,0.29982719421386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,1,power_law_1.01,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,1,power_law_1.01,0.315391993522644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,1,power_law_1.01,0.33361918926239015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,1,power_law_1.01,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,4,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,4,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,1,power_law_1.01,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,4,power_law_1.2,0.16957440376281738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,1,power_law_1.01,0.37355520725250246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,4,power_law_1.2,0.2582528114318848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,1,power_law_1.01,0.3950592041015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,4,power_law_1.2,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,1,power_law_1.01,0.41942400932312013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,4,power_law_1.2,0.4415487766265869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,1,power_law_1.01,0.47718400955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,1,power_law_1.01,0.5404672145843505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,1,power_law_1.01,0.6565887928009033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,1,power_law_1.01,0.8427519798278809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,4,power_law_1.2,0.41021437644958497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,1,power_law_1.01,1.178009605407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,4,power_law_1.2,0.42987518310546874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,4,power_law_1.2,0.4450047969818115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,4,power_law_1.2,0.470630407333374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,1,power_law_1.01,1.5022015571594238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,4,power_law_1.2,0.42946557998657225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,4,power_law_1.2,0.46878719329833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,1,power_law_1.01,2.11517448425293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,4,power_law_1.2,0.47411198616027833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,4,power_law_1.2,0.4888576030731201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,4,power_law_1.2,0.47902722358703614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,4,power_law_1.2,0.5072896003723144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,1,power_law_1.01,2.7465728759765624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,4,power_law_1.2,0.5167103767395019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,4,power_law_1.2,0.5173247814178467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,4,power_law_1.2,0.5834752082824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,4,power_law_1.2,0.6498303890228272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,1,power_law_1.01,4.027801513671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,4,power_law_1.2,0.7612415790557862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,4,power_law_1.2,0.9408512115478516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,4,power_law_1.2,1.0606592178344727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,1,power_law_1.01,5.38337287902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,4,power_law_1.2,1.5618047714233398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,4,power_law_1.2,1.6504831314086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,4,power_law_1.2,2.489344024658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,4,power_law_1.2,3.5448833465576173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,1,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,1,balanced,0.23859200874964395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,1,balanced,0.4532906611760457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,1,balanced,0.8796053727467855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,1,balanced,1.7256107330322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,1,balanced,1.734997272491455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,1,balanced,1.7462612787882488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,1,balanced,1.7532587051391602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,1,balanced,1.7634986241658528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,1,balanced,1.7716906865437825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,1,balanced,1.7889280319213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,1,balanced,1.80514129002889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,1,balanced,1.8213547070821126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,1,balanced,1.8474666277567546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,1,balanced,1.881941318511963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,1,balanced,1.9104426701863606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,1,balanced,1.970688025156657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,1,balanced,2.1007359822591147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,1,balanced,2.1877759297688804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,1,balanced,2.385749340057373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,1,balanced,2.6200745900472007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,1,balanced,3.07148806254069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,1,balanced,3.503957430521647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,1,balanced,4.531541188557942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,1,balanced,5.603498458862305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,1,balanced,8.235008239746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,1,balanced,11.0109011332194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,2,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,2,power_law_1.2,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,2,power_law_1.2,0.29757440090179443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,2,power_law_1.2,0.372326397895813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,2,power_law_1.2,0.41634559631347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,2,power_law_1.2,0.7819263935089111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,2,power_law_1.2,0.7960512161254882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,2,power_law_1.2,0.8353792190551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,2,power_law_1.2,0.842956829071045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,2,power_law_1.2,0.8624128341674805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,2,power_law_1.2,0.901529598236084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,2,power_law_1.2,0.9109503746032714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,2,power_law_1.2,0.880025577545166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,2,power_law_1.2,0.9285632133483886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,2,power_law_1.2,0.931430435180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,2,power_law_1.2,0.9666560173034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,2,power_law_1.2,1.0090496063232421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,2,power_law_1.2,1.0745856285095214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,2,power_law_1.2,1.1579392433166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,2,power_law_1.2,1.286143970489502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,2,power_law_1.2,1.4422016143798828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,2,power_law_1.2,1.8298879623413087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,2,power_law_1.2,2.2728704452514648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,2,power_law_1.2,3.0511104583740236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,2,power_law_1.2,3.5774463653564452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,2,power_law_1.2,5.117337417602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,2,power_law_1.2,6.967705535888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,8,power_law_1.01,0.5156864166259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,8,power_law_1.01,0.4577280044555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,8,power_law_1.01,0.46407041549682615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,8,power_law_1.01,0.46387200355529784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,8,power_law_1.01,0.4667391777038574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,8,power_law_1.01,0.4739071846008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,8,power_law_1.01,0.4753407955169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,8,power_law_1.01,0.4792319774627686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,8,power_law_1.01,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,8,power_law_1.01,0.4888576030731201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,8,power_law_1.01,0.8112128257751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,8,power_law_1.01,1.0557439804077149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,8,power_law_1.01,1.0596351623535156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,8,power_law_1.01,0.9465855598449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,8,power_law_1.01,1.1720704078674316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,8,power_law_1.01,1.2107775688171387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,8,power_law_1.01,1.516748809814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,8,power_law_1.01,2.7176959991455076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,8,power_law_1.01,2.594803237915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,8,power_law_1.01,3.808665466308594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,8,power_law_1.01,4.851097488403321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,8,power_law_1.01,6.70044174194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,8,power_law_1.2,0.5912576198577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,8,power_law_1.2,0.6260735988616943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,8,power_law_1.01,8.997869110107422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,8,power_law_1.2,0.8880000114440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,8,power_law_1.2,1.2683263778686524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,8,power_law_1.2,0.9555583953857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,8,power_law_1.2,1.1059200286865234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,8,power_law_1.2,1.2691455841064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,8,power_law_1.2,1.2990464210510253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,8,power_law_1.2,1.1831295967102051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,8,power_law_1.2,1.2686911582946778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,8,power_law_1.2,1.3049856185913087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,8,power_law_1.2,1.3895359992980958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,8,power_law_1.2,1.4034560203552247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,8,power_law_1.01,0.28608639240264894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,8,power_law_1.2,1.4221311569213868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,8,power_law_1.01,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,8,power_law_1.01,0.2770944118499756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,8,power_law_1.01,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,8,power_law_1.2,1.439129638671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,8,power_law_1.01,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,8,power_law_1.01,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,8,power_law_1.01,0.28344318866729734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,8,power_law_1.2,1.4817279815673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,8,power_law_1.01,0.28631041049957273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,8,power_law_1.01,0.3336127996444702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,8,power_law_1.2,1.4800895690917968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,8,power_law_1.01,0.33420801162719727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,8,power_law_1.01,0.5545983791351319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,8,power_law_1.2,1.5140735626220703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,8,power_law_1.01,0.582041597366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,8,power_law_1.01,0.8128512382507325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,8,power_law_1.2,1.7297407150268556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,8,power_law_1.01,0.5803775787353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,8,power_law_1.2,1.9083263397216796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,8,power_law_1.01,0.6213632106781006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,8,power_law_1.2,2.1815296173095704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,8,power_law_1.01,0.8056832313537597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,8,power_law_1.2,2.804531288146973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,8,power_law_1.01,0.6872831821441651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,8,power_law_1.01,1.0651647567749023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,8,power_law_1.2,3.965542221069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,8,power_law_1.01,1.1233280181884766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,1,8,power_law_1.01,1.063526439666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,8,power_law_1.2,4.987699127197265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,1,8,power_law_1.01,2.109440040588379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,1,8,power_law_1.01,4.089651107788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,8,power_law_1.01,1.7758207321166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,1,8,power_law_1.01,3.789004898071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,1,8,power_law_1.01,4.514611053466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,8,power_law_1.01,11.742002868652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,1,8,power_law_1.01,5.361235046386719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,8,power_law_1.01,2.294988822937012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,1,8,power_law_1.01,4.97070083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,8,power_law_1.2,6.522265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,1,8,power_law_1.01,6.010854339599609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,1,8,power_law_1.01,5.449478530883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,1,8,power_law_1.01,4.511129760742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,8,power_law_1.01,3.3699840545654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,1,8,power_law_1.01,4.625817489624024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,1,8,power_law_1.01,4.840652847290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,8,power_law_1.01,4.185907363891602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,8,power_law_1.2,8.554073333740234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,1,8,power_law_1.01,4.804390335083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,8,power_law_1.01,5.858713531494141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,1,8,power_law_1.01,4.991788864135742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,8,power_law_1.01,15.268453979492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,1,8,power_law_1.01,5.452595138549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,1,8,power_law_1.01,5.422284698486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,8,power_law_1.2,10.901503753662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,1,8,power_law_1.01,5.8953601837158205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,1,8,power_law_1.01,5.978726577758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,1,8,power_law_1.01,6.300262451171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,1,8,power_law_1.01,6.1929473876953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,1,8,power_law_1.01,6.775807952880859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,8,power_law_1.01,7.367884826660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,1,8,power_law_1.01,7.349657440185547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,1,8,power_law_1.01,8.28436508178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,1,8,power_law_1.01,9.67822723388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,1,8,power_law_1.01,11.686093139648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,1,8,power_law_1.01,16.723353576660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,32,power_law_1.2,0.3176448106765747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,32,power_law_1.2,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,32,power_law_1.2,0.4122623920440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,32,power_law_1.2,0.41205759048461915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,32,power_law_1.2,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,32,power_law_1.2,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,1,8,power_law_1.01,16.61071319580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,32,power_law_1.2,0.3911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,32,power_law_1.2,0.3551232099533081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,32,power_law_1.2,0.3891200065612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,32,power_law_1.2,0.3719167947769165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,32,power_law_1.2,0.3737600088119507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,32,power_law_1.2,0.36515839099884034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,32,power_law_1.2,0.37294080257415774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,32,power_law_1.2,0.36331520080566404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,32,power_law_1.2,0.4257791996002197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,32,power_law_1.2,0.4087808132171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,32,power_law_1.2,0.42188801765441897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,32,power_law_1.2,0.4526080131530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,32,power_law_1.2,0.43909120559692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,32,power_law_1.2,0.5211967945098877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,32,power_law_1.2,0.6363135814666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,32,power_law_1.2,0.7827455997467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,32,power_law_1.2,1.0072064399719238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,32,power_law_1.2,1.552793598175049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,32,power_law_1.2,1.8477056503295899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,32,power_law_1.2,2.5522176742553713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,32,power_law_1.2,4.183244705200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,128,balanced,0.05749866863091787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,128,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,128,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,128,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,128,balanced,0.05783466498057047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,128,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,128,balanced,0.2903040051460266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,128,balanced,0.2921813329060872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,128,balanced,0.2926773428916931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,128,balanced,0.292522668838501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,128,balanced,0.2950826684633891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,128,balanced,0.2962719996770223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,128,balanced,0.29781333605448407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,128,balanced,0.2996906638145447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,128,balanced,0.3054933349291484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,128,balanced,0.30805333455403644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,8,power_law_1.01,21.410610961914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,128,balanced,0.314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,8,power_law_1.01,11.562188720703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,128,balanced,0.328874667485555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,128,balanced,0.3403093417485555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,128,balanced,0.38229334354400635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,128,balanced,0.3824640115102132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,128,balanced,0.4792160193125407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,128,balanced,0.48264535268147785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,128,balanced,0.702122688293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,128,balanced,0.8244907061258951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,128,balanced,1.0968746344248455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,128,balanced,1.435306708017985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,1,power_law_1.01,0.6080512046813965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,1,power_law_1.01,1.0446847915649413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,1,power_law_1.01,2.027724838256836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,1,power_law_1.01,3.976601409912109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,1,power_law_1.01,7.046348571777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,1,power_law_1.01,10.178765106201173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,1,power_law_1.01,12.143206024169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,1,power_law_1.01,15.499058532714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,8,power_law_1.01,15.675801086425782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,1,power_law_1.01,16.50810852050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,1,power_law_1.01,16.650035095214843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,8,power_law_1.01,28.258712768554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,1,power_law_1.01,17.9378173828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,1,power_law_1.01,18.282701110839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,1,power_law_1.01,18.525798034667968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,1,power_law_1.01,19.260826110839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,1,power_law_1.01,19.098828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,1,power_law_1.01,20.16583709716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,1,power_law_1.01,20.84864044189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,1,power_law_1.01,21.668045043945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,1,power_law_1.01,22.55749053955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,1,power_law_1.01,23.982080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,1,power_law_1.01,24.588275146484374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,1,power_law_1.01,26.78968200683594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,1,power_law_1.01,28.2957763671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,1,power_law_1.01,32.222412109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,4,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,4,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,4,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,4,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,4,balanced,0.07816533247629802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,4,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,4,balanced,0.4106239875157674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,4,balanced,0.41881601015726727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,4,balanced,0.4210346539815267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,4,balanced,0.4242773453394572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,4,balanced,0.4242773453394572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,4,balanced,0.434005339940389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,4,balanced,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,4,balanced,0.4485119978586833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,4,balanced,0.4614826838175456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,4,balanced,0.47086934248606366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,4,balanced,0.5189973513285319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,4,balanced,0.5376000006993612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,4,balanced,0.6031359831492106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,4,balanced,0.6647466818491617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,4,balanced,0.762880007425944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,4,balanced,0.9931093056996664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,4,balanced,1.2284586429595947
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,4,balanced,1.778175989786784
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,4,balanced,2.369365374247233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,4,balanced,3.4652160008748374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,4,balanced,4.517375946044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,1,power_law_1.01,36.62889099121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,1,power_law_1.01,47.06263122558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,1,power_law_1.01,60.503656005859376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,64,power_law_1.01,0.4419583797454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,64,power_law_1.01,0.41164798736572267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,64,power_law_1.01,0.4169600009918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,64,power_law_1.01,0.4171775817871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,64,power_law_1.01,0.39280641078948975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,64,power_law_1.01,0.3516416072845459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,64,power_law_1.01,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,64,power_law_1.01,0.38766720294952395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,64,power_law_1.01,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,64,power_law_1.01,0.41635842323303224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,64,power_law_1.01,0.3975167989730835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,64,power_law_1.01,0.38807039260864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,64,power_law_1.01,0.41492481231689454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,64,power_law_1.01,0.4087808132171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,64,power_law_1.01,0.4315135955810547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,64,power_law_1.01,0.44994559288024905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,64,power_law_1.01,0.4607999801635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,64,power_law_1.01,0.4483071804046631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,64,power_law_1.01,0.5132287979125977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,64,power_law_1.01,0.5529600143432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,64,power_law_1.01,0.6352896213531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,64,power_law_1.01,0.8269824028015137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,64,power_law_1.01,0.9879551887512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,64,power_law_1.01,1.4012415885925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,64,power_law_1.01,1.701683235168457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,64,power_law_1.01,2.9526016235351564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,64,power_law_1.01,3.415449523925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,1,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,1,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,1,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,1,balanced,0.057333335280418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,1,balanced,0.23961599667867026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,1,balanced,0.24422399202982584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,1,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,1,balanced,0.2500266631444295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,1,balanced,0.25412267446517944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,1,balanced,0.25853333870569867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,1,balanced,0.26709334055582684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,1,balanced,0.2768213351567586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,1,balanced,0.2826240062713623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,1,balanced,0.3002026677131653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,1,balanced,0.31522132953008014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,1,balanced,0.3258026639620463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,1,balanced,0.3653973340988159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,1,balanced,0.4275199969609578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,1,balanced,0.5314559936523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,1,balanced,0.7799466451009115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,1,balanced,1.0395306746164958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,1,balanced,1.5132959683736165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,1,balanced,2.011301358540853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,1,balanced,3.064490636189779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,1,balanced,4.156245231628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,1,balanced,6.306986490885417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,1,balanced,8.375466664632162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,1,power_law_1.01,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,1,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,1,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,1,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,1,power_law_1.01,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,1,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,1,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,1,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,1,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,1,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,1,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,1,power_law_1.01,0.06469759941101075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,1,power_law_1.01,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,1,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,1,power_law_1.01,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,1,power_law_1.01,0.10833920240402221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,1,power_law_1.01,0.156876802444458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,1,power_law_1.01,0.21524479389190673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,1,power_law_1.01,0.26357760429382326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,1,power_law_1.01,0.3205120086669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,1,power_law_1.01,0.4196352005004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,1,power_law_1.01,0.6449151992797851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,16,balanced,0.03342933456103007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,16,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,16,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,16,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,16,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,16,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,16,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,16,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,16,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,16,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,16,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,16,balanced,0.04351999859015147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,16,balanced,0.04504533112049103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,16,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,16,balanced,0.04863999783992767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,16,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,16,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,16,balanced,0.06434133152167003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,16,balanced,0.07577600081761678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,16,balanced,0.08482133348782857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,16,balanced,0.13226667046546936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,1,power_law_1.01,0.8652799606323243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,16,balanced,0.18363734086354574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,16,balanced,0.30003199974695843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,16,balanced,0.3375786542892456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,16,balanced,0.5420373280843099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,16,balanced,0.7425706386566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,1,power_law_1.01,1.3488127708435058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,16,8,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,16,8,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,16,8,power_law_1.01,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,16,8,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,16,8,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,16,8,power_law_1.01,0.03621760010719299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,16,8,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,16,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,16,8,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,16,8,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,16,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,16,8,power_law_1.01,0.04297600090503693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,16,8,power_law_1.01,0.04750080108642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,16,8,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,16,8,power_law_1.01,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,16,8,power_law_1.01,0.08499199748039246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,16,8,power_law_1.01,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,16,8,power_law_1.01,0.1372159957885742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,16,8,power_law_1.01,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,16,8,power_law_1.01,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,16,8,power_law_1.01,0.25927679538726806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,1,power_law_1.01,1.900339126586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,16,8,power_law_1.01,0.42595200538635253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,16,8,power_law_1.01,0.5498879909515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,16,8,power_law_1.01,0.8820735931396484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,1,power_law_1.01,2.912646484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,16,8,power_law_1.01,1.1806719779968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,1,power_law_1.01,3.9405567169189455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,16,8,power_law_1.01,1.8769920349121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,16,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,16,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,16,balanced,0.2908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,16,balanced,0.5507413148880005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,16,balanced,0.9094826380411783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,16,balanced,1.077077309290568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,16,balanced,1.0804906686147053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,16,balanced,1.0676906903584797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,16,balanced,1.0693973700205486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,16,balanced,1.0714453061421711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,16,balanced,1.0763946374257405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,16,balanced,1.0827093124389648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,16,balanced,1.087829351425171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,16,balanced,1.0951680342356365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,16,balanced,1.1048959891001384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,16,balanced,1.1146240234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,16,balanced,1.1328852971394856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,16,balanced,1.14738130569458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,16,balanced,1.1728213628133137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,16,balanced,1.2194133599599202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,16,balanced,1.2815360228220622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,16,balanced,1.4112426439921062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,16,balanced,1.542143980662028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,16,balanced,1.87391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,16,balanced,2.212010701497396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,16,balanced,2.9972480138142905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,16,balanced,3.7121706008911133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,16,8,power_law_1.01,2.5888704299926757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,4,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,4,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,4,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,4,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,4,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,4,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,4,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,4,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,4,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,4,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,4,power_law_1.2,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,4,power_law_1.2,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,4,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,4,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,4,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,4,power_law_1.2,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,4,power_law_1.2,0.09502720236778259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,4,power_law_1.2,0.11386879682540893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,4,power_law_1.2,0.1509376049041748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,4,power_law_1.2,0.2568192005157471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,32,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,32,power_law_1.01,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,32,power_law_1.01,0.2136064052581787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,4,power_law_1.2,0.4200448036193848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,32,power_law_1.01,0.21299200057983397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,32,power_law_1.01,0.21422080993652343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,32,power_law_1.01,0.12984319925308227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,32,power_law_1.01,0.15175679922103882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,32,power_law_1.01,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,32,power_law_1.01,0.17592320442199708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,32,power_law_1.01,0.16732159852981568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,32,power_law_1.01,0.19189759492874145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,32,power_law_1.01,0.15708160400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,32,power_law_1.01,0.19640320539474487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,32,power_law_1.01,0.19169280529022217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,32,power_law_1.01,0.18677760362625123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,32,power_law_1.01,0.2091007947921753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,32,power_law_1.01,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,32,power_law_1.01,0.22507519721984864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,32,power_law_1.01,0.2678783893585205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,32,power_law_1.01,0.2899967908859253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,32,power_law_1.01,0.35819520950317385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,32,power_law_1.01,0.42946557998657225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,32,power_law_1.01,0.5644288063049316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,32,power_law_1.01,0.8177663803100585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,32,power_law_1.01,1.3039615631103516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,32,power_law_1.01,1.8274303436279298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,32,power_law_1.01,2.1786624908447267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,4,power_law_1.2,0.4937727928161621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,16,balanced,0.03515200068553289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,16,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,16,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,16,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,16,balanced,0.0405973345041275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,16,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,16,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,16,balanced,0.04195733368396759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,16,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,16,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,16,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,16,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,16,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,16,balanced,0.048469334840774536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,16,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,16,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,16,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,16,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,16,balanced,0.07492266595363617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,16,balanced,0.08499200145403545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,16,balanced,0.11281067132949829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,16,balanced,0.14114133516947427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,16,balanced,0.2867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,16,balanced,0.3643733263015747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,4,power_law_1.2,0.788479995727539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,16,balanced,0.5307733217875162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,16,balanced,0.7553653717041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,4,power_law_1.2,1.223475170135498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,1,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,1,power_law_1.01,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,1,power_law_1.01,0.18042880296707153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,1,power_law_1.01,0.30556159019470214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,1,power_law_1.01,0.43843841552734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,1,power_law_1.01,0.7469056129455567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,1,power_law_1.01,0.7997439861297607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,1,power_law_1.01,0.7878655910491943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,1,power_law_1.01,0.8351743698120118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,1,power_law_1.01,0.8683135986328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,1,power_law_1.01,0.8716287612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,1,power_law_1.01,0.8837120056152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,1,power_law_1.01,0.9224191665649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,1,power_law_1.01,0.9299967765808106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,1,power_law_1.01,0.9687040328979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,1,power_law_1.01,0.9787391662597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,1,power_law_1.01,1.0375167846679687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,1,power_law_1.01,1.075814437866211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,1,power_law_1.01,1.1294719696044921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,1,power_law_1.01,1.2388031959533692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,1,power_law_1.01,1.4301183700561524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,1,power_law_1.01,1.7334272384643554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,1,power_law_1.01,1.9576831817626954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,1,power_law_1.01,2.5378816604614256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,1,power_law_1.01,3.1698944091796877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,1,power_law_1.01,4.469555282592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,1,power_law_1.01,5.590220642089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,4,power_law_1.2,1.8313215255737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,8,power_law_1.01,0.45708799362182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,8,power_law_1.01,0.5879807949066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,8,power_law_1.01,0.7057407855987549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,8,power_law_1.01,0.8140800476074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,8,power_law_1.01,0.5516992092132569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,8,power_law_1.01,0.7161856174468995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,8,power_law_1.01,0.8761343955993652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,8,power_law_1.01,0.8480640411376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,8,power_law_1.01,0.8962047576904297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,8,power_law_1.01,0.8591360092163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,8,power_law_1.01,0.89169921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,8,power_law_1.01,0.8935423851013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,8,power_law_1.01,0.9215999603271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,8,power_law_1.01,0.9428928375244141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,8,power_law_1.01,0.9574399948120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,8,power_law_1.01,0.9635583877563476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,8,power_law_1.01,0.9750528335571289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,8,power_law_1.01,0.9864895820617676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,8,power_law_1.01,1.045299243927002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,8,power_law_1.01,1.3141759872436523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,8,power_law_1.01,1.5052800178527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,8,power_law_1.01,2.1995519638061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,8,power_law_1.01,2.0197376251220702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,8,power_law_1.01,2.975948715209961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,8,power_law_1.01,3.6597759246826174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,8,power_law_1.01,5.43109130859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,8,power_law_1.01,7.669760131835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,4,power_law_1.2,2.4168447494506835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,2,power_law_1.2,0.20992000102996827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,2,power_law_1.2,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,2,power_law_1.2,0.32276480197906493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,2,power_law_1.2,0.5056511878967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,2,power_law_1.2,0.5322751998901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,2,power_law_1.2,0.5124095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,2,power_law_1.2,0.5525504112243652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,2,power_law_1.2,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,2,power_law_1.2,0.5736447811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,2,power_law_1.2,0.5791744232177735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,2,power_law_1.2,0.5646336078643799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,2,power_law_1.2,0.6016831874847413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,2,power_law_1.2,0.6000639915466308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,2,power_law_1.2,0.5844992160797119
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,2,power_law_1.2,0.6428671836853027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,2,power_law_1.2,0.7049215793609619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,2,power_law_1.2,0.7809023857116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,2,power_law_1.2,0.9172991752624512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,2,power_law_1.2,1.0496000289916991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,2,power_law_1.2,1.4768128395080566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,2,power_law_1.2,1.6154624938964843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,2,power_law_1.2,2.4328191757202147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,2,power_law_1.2,2.9861888885498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,2,power_law_1.2,3.7787647247314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,1,balanced,0.026965332527955372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,1,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,1,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,1,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,1,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,1,balanced,0.03054933249950409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,1,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,1,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,1,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,1,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,1,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,1,balanced,0.03703466554482778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,1,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,1,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,1,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,1,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,1,balanced,0.06297599772612254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,1,balanced,0.09079466263453166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,1,balanced,0.10734933614730835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,1,balanced,0.19473065932591757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,1,balanced,0.25565866629282635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,1,balanced,0.3831466833750407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,1,balanced,0.5116586685180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,1,balanced,0.8234666983286539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,1,balanced,1.1139413515726726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,1,balanced,1.7664000193277996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,1,balanced,2.47432533899943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,2,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,2,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,2,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,2,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,2,balanced,0.15018666783968607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,2,balanced,0.3573760191599528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,2,balanced,0.3595946629842122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,2,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,2,balanced,0.3577173153559367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,2,balanced,0.3604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,2,balanced,0.36556800206502277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,2,balanced,0.3720533450444539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,2,balanced,0.3766293525695801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,2,balanced,0.3838293155034383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,2,balanced,0.39236267407735187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,2,balanced,0.4010666608810425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,2,balanced,0.4169280131657918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,2,balanced,0.4503893454869588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,2,balanced,0.4790613253911336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,2,balanced,0.5454506476720175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,2,balanced,0.6248000065485636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,2,balanced,0.8311466375986735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,2,balanced,1.0533546606699626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,2,balanced,1.5056212743123372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,2,balanced,1.9742719332377117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,2,balanced,2.907477378845215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,2,balanced,3.8423894246419272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,2,power_law_1.2,5.262131118774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,2,power_law_1.2,8.861491394042968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,8,power_law_1.01,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,8,power_law_1.01,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,8,power_law_1.01,0.5437439918518067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,8,power_law_1.01,0.5279744148254395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,8,power_law_1.01,0.6420479774475097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,8,power_law_1.01,0.7366655826568603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,8,power_law_1.01,0.6948863983154296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,8,power_law_1.01,0.7561215877532959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,8,power_law_1.01,0.7233535766601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,8,power_law_1.01,0.6412288188934326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,8,power_law_1.01,0.653926420211792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,8,power_law_1.01,0.6881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,8,power_law_1.01,0.7254015922546386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,8,power_law_1.01,0.6752255916595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,8,power_law_1.01,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,8,power_law_1.01,0.7473152160644532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,8,power_law_1.01,0.7544832229614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,8,power_law_1.01,0.7868415832519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,8,power_law_1.01,0.8390656471252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,8,power_law_1.01,0.9537535667419433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,8,power_law_1.01,1.0827775955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,8,power_law_1.01,1.2230655670166015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,8,power_law_1.01,1.5173631668090821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,8,power_law_1.01,2.064793586730957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,8,power_law_1.01,0.24412159919738768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,8,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,8,power_law_1.01,2.4989696502685548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,8,power_law_1.01,0.29122560024261473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,8,power_law_1.01,0.3401727914810181
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,8,power_law_1.01,0.34201600551605227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,8,power_law_1.01,0.43048958778381347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,8,power_law_1.01,0.4339712142944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,8,power_law_1.01,3.4244609832763673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,8,power_law_1.01,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,8,power_law_1.01,0.42598400115966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,8,power_law_1.01,0.45465598106384275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,8,power_law_1.01,0.42803201675415037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,8,power_law_1.01,0.466534423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,8,power_law_1.01,4.673535919189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,8,power_law_1.01,0.45996799468994143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,8,power_law_1.01,0.4675583839416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,8,power_law_1.01,0.47329277992248536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,8,power_law_1.01,0.4888576030731201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,8,power_law_1.01,0.5058559894561767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,8,power_law_1.01,0.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,8,power_law_1.01,0.5701632022857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,8,power_law_1.01,0.618291187286377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,8,power_law_1.01,0.7712639808654785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,8,power_law_1.01,0.9984000205993653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,8,power_law_1.01,1.1053055763244628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,8,power_law_1.01,1.6754688262939452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,8,power_law_1.01,2.2017791748046873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,2,8,power_law_1.01,3.3765377044677733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,2,8,power_law_1.01,4.407910537719727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,32,power_law_1.01,0.05221760272979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,32,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,32,power_law_1.01,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,32,power_law_1.01,0.045049598813056944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,32,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,32,power_law_1.01,0.040320000052452086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,32,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,32,power_law_1.01,0.04195840060710907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,32,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,32,power_law_1.01,0.041971200704574586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,32,power_law_1.01,0.04257279932498932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,32,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,32,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,32,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,32,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,32,power_law_1.01,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,32,power_law_1.01,0.0644927978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,32,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,32,power_law_1.01,0.09356160163879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,32,power_law_1.01,0.1146880030632019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,32,power_law_1.01,0.132915198802948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,32,power_law_1.01,0.237772798538208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,32,power_law_1.01,0.31496319770812986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,32,power_law_1.01,0.4335616111755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,32,power_law_1.01,0.5658624172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,32,power_law_1.01,0.8650752067565918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,2,power_law_1.2,11.947622680664063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,32,power_law_1.01,1.1806719779968262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,32,power_law_1.2,0.5998464107513428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,32,power_law_1.2,0.5390336036682128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,32,power_law_1.2,0.558080005645752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,32,power_law_1.2,0.5447679996490479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,32,power_law_1.2,0.37416958808898926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,32,power_law_1.2,0.4366335868835449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,32,power_law_1.2,0.5013504028320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,32,power_law_1.2,0.4966400146484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,32,power_law_1.2,0.5238783836364747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,32,power_law_1.2,0.5015552043914795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,32,power_law_1.2,0.5294079780578613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,32,power_law_1.2,0.4607935905456543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,32,power_law_1.2,0.5388288021087646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,32,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,32,power_law_1.2,0.5490687847137451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,32,power_law_1.2,0.571392011642456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,32,power_law_1.2,0.5939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,32,power_law_1.2,0.6506495952606202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,32,power_law_1.2,0.692633581161499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,32,power_law_1.2,0.8538111686706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,32,power_law_1.2,1.001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,32,power_law_1.2,1.3174783706665039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,32,power_law_1.2,1.6338560104370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,32,power_law_1.2,2.3496383666992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,32,power_law_1.2,2.8876800537109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,32,power_law_1.2,4.961875152587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,32,power_law_1.2,6.221823883056641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,1,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,1,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,1,balanced,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,1,balanced,0.2846720019976298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,1,balanced,0.2775040070215861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,1,balanced,0.27938133478164673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,1,balanced,0.2802346746126811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,1,balanced,0.2815999984741211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,1,balanced,0.28296534220377606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,1,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,1,balanced,0.2974666754404704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,1,balanced,0.29713066418965656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,1,balanced,0.3003679911295573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,1,balanced,0.2988426685333252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,1,balanced,0.3036160071690877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,1,balanced,0.3097599943478902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,1,balanced,0.3211946686108907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,1,balanced,0.3505493402481079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,1,balanced,0.38331735134124756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,1,balanced,0.4771840174992879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,1,balanced,0.5976746479670206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,1,balanced,0.86954665184021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,1,balanced,1.1996160348256428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,1,balanced,1.8631679217020671
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,1,balanced,2.5495893160502114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,1,balanced,3.9193598429361978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,1,balanced,5.299536069234212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,32,power_law_1.01,0.2519040107727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,32,power_law_1.01,0.23859200477600098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,32,power_law_1.01,0.23879680633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,32,power_law_1.01,0.19640320539474487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,32,power_law_1.01,0.21299200057983397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,32,power_law_1.01,0.2420736074447632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,32,power_law_1.01,0.23121919631958007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,32,power_law_1.01,0.24535040855407714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,32,power_law_1.01,0.24637439250946044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,32,power_law_1.01,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,32,power_law_1.01,0.25620479583740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,32,power_law_1.01,0.2568192005157471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,32,power_law_1.01,0.2584575891494751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,32,power_law_1.01,0.2578432083129883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,32,power_law_1.01,0.2590719938278198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,32,power_law_1.01,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,32,power_law_1.01,0.2703360080718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,32,power_law_1.01,0.2942975997924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,32,power_law_1.01,0.37662720680236816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,32,power_law_1.01,0.44890241622924804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,32,power_law_1.01,0.4870143890380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,32,power_law_1.01,0.766156816482544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,32,power_law_1.01,0.901734447479248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,32,power_law_1.01,1.3961215972900392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,128,power_law_1.2,0.028230398893356323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,128,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,32,power_law_1.01,1.760256004333496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,128,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,128,power_law_1.2,0.028224000334739686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,128,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,128,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,32,power_law_1.01,2.5034751892089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,128,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,128,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,128,power_law_1.2,0.03214719891548157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,128,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,128,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,128,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,32,power_law_1.01,3.530547332763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,128,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,128,power_law_1.2,0.032953599095344545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,128,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,128,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,128,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,128,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,128,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,128,power_law_1.2,0.08865280151367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,128,power_law_1.2,0.11141120195388794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,128,power_law_1.2,0.21647360324859619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,128,power_law_1.2,0.2725888013839722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,128,power_law_1.2,0.5441535949707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,128,power_law_1.2,0.7438208103179932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,128,power_law_1.2,1.0473471641540528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,128,power_law_1.2,1.671353530883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,2,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,2,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,2,power_law_1.2,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,2,power_law_1.2,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,2,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,2,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,2,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,2,power_law_1.2,0.07720959782600403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,2,power_law_1.2,0.09502080082893372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,2,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,2,power_law_1.2,0.09072639942169189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,2,power_law_1.2,0.14213119745254515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,2,power_law_1.2,0.16814080476760865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,2,power_law_1.2,0.18575359582901002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,2,power_law_1.2,0.20500481128692627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,2,power_law_1.2,0.2174976110458374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,2,power_law_1.2,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,2,power_law_1.2,0.2766848087310791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,2,power_law_1.2,0.2934783935546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,2,power_law_1.2,0.36126720905303955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,2,power_law_1.2,0.41984000205993655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,2,power_law_1.2,0.5976064205169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,2,power_law_1.2,0.7796735763549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,2,power_law_1.2,1.1978752136230468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,2,power_law_1.2,1.700044822692871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,2,power_law_1.2,2.388787269592285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,2,power_law_1.2,3.3460224151611326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,256,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,256,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,256,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,256,power_law_1.01,0.03888640105724335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,256,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,256,power_law_1.01,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,256,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,256,power_law_1.01,0.04092159867286682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,256,power_law_1.01,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,256,power_law_1.01,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,256,power_law_1.01,0.04237439930438995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,256,power_law_1.01,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,256,power_law_1.01,0.0442111998796463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,256,power_law_1.01,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,256,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,256,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,256,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,256,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,256,power_law_1.01,0.07208960056304932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,256,power_law_1.01,0.09318400025367737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,256,power_law_1.01,0.11776000261306763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,256,power_law_1.01,0.16424959897994995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,256,power_law_1.01,0.21196799278259276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,256,power_law_1.01,0.4278272151947021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,256,power_law_1.01,0.5566463947296143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,256,power_law_1.01,0.8243200302124023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,256,power_law_1.01,1.2040191650390626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,2,power_law_1.2,0.36515839099884034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,2,power_law_1.2,0.37109758853912356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,2,power_law_1.2,0.5253119945526123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,2,power_law_1.2,0.8865792274475097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,2,power_law_1.2,0.8900608062744141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,2,power_law_1.2,0.8957951545715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,2,power_law_1.2,0.901734447479248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,2,power_law_1.2,0.9060352325439454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,2,power_law_1.2,0.9275263786315918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,2,power_law_1.2,0.982630443572998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,2,power_law_1.2,0.9517056465148925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,2,power_law_1.2,1.0618880271911622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,2,power_law_1.2,1.1470848083496095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,16,balanced,0.04266133407751719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,16,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,16,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,16,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,2,power_law_1.2,1.1520000457763673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,16,balanced,0.04775466521581014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,16,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,16,balanced,0.2404693365097046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,16,balanced,0.23142399390538534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,16,balanced,0.23227733373641968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,16,balanced,0.23381332556406656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,2,power_law_1.2,1.2652544021606444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,16,balanced,0.2362026572227478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,16,balanced,0.24183466037114462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,16,balanced,0.24371200799942017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,16,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,16,balanced,0.25975465774536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,16,balanced,0.2650453249613444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,16,balanced,0.27989333868026733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,16,balanced,0.3058346708615621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,2,power_law_1.2,1.3125632286071778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,16,balanced,0.3333119948705037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,16,balanced,0.3838293155034383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,16,balanced,0.42683732509613037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,16,balanced,0.5119839906692505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,16,balanced,0.5952853361765543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,2,power_law_1.2,1.4223360061645507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,16,balanced,0.853653351465861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,16,balanced,1.1351040204366047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,16,balanced,1.6587093671162922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,2,power_law_1.2,1.722368049621582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,16,balanced,2.230954647064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,2,power_law_1.2,2.1176319122314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,2,power_law_1.2,2.555904006958008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,2,power_law_1.2,3.2765953063964846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,2,power_law_1.2,4.126310348510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,2,power_law_1.2,5.308211135864258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.10895359516143799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.28098559379577637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.4190207958221436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.5720064163208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.7565311908721923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.8067071914672852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.8353792190551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,2,balanced,0.06738666693369548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.8687616348266601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,2,balanced,0.2781760096549988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,2,balanced,0.5339999993642172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,2,balanced,1.027242660522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.9150464057922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,2,balanced,2.0278612772623696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.9687040328979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.9945088386535644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,2,balanced,4.02020804087321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,1,power_law_1.01,1.0518527984619142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,1,power_law_1.01,1.1194368362426759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,2,balanced,6.0009816487630205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,1,power_law_1.01,1.173299217224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,1,power_law_1.01,1.264844799041748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,1,power_law_1.01,1.461248016357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,2,balanced,6.009685516357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,2,power_law_1.2,7.910809326171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,1,power_law_1.01,1.6918527603149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,2,balanced,6.027946472167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,1,power_law_1.01,2.0942848205566404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,1,power_law_1.01,2.522316741943359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,2,balanced,6.032549540201823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,1,power_law_1.01,3.400089645385742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,2,balanced,6.066517512003581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,2,balanced,6.071296056111653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,1,power_law_1.01,4.305920028686524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,2,balanced,6.095359802246094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,1,power_law_1.01,6.1466625213623045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,2,balanced,6.14024543762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,2,balanced,6.166528065999349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,1,power_law_1.01,7.979212951660156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,2,balanced,6.199637095133464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,2,balanced,6.259712219238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,1,power_law_1.01,11.660288238525391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,2,balanced,6.390954971313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,2,balanced,6.688767751057942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,2,balanced,6.930773417154948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,1,power_law_1.01,15.3849853515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,2,balanced,7.163381576538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,2,balanced,7.668053309122722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,2,balanced,8.592042922973633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,2,balanced,9.159680048624674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,2,balanced,10.056533177693685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,2,balanced,12.668416341145834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,2,balanced,15.144448598225912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,2,power_law_1.2,10.392166137695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.6074368000030518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,1,power_law_1.2,1.051238441467285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,1,power_law_1.2,2.027315139770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,1,power_law_1.2,4.036608123779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,2,power_law_1.2,13.934182739257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,1,power_law_1.2,6.4614402770996096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,1,power_law_1.2,9.134899139404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,1,power_law_1.2,10.568498992919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,1,power_law_1.2,15.361228942871094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,1,power_law_1.2,15.944703674316406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,1,power_law_1.2,16.476979064941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,1,power_law_1.2,17.451622009277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,1,power_law_1.2,17.973452758789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,1,power_law_1.2,18.390016174316408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,1,power_law_1.2,19.24669494628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,1,power_law_1.2,20.145356750488283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,1,power_law_1.2,20.260659790039064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,1,power_law_1.2,21.298381042480468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,1,power_law_1.2,23.78035125732422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,1,power_law_1.2,0.6060031890869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,1,power_law_1.2,1.0383359909057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,1,power_law_1.2,24.078746032714843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,1,power_law_1.2,2.016870307922363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,1,power_law_1.2,3.709747314453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,2,power_law_1.2,18.506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,1,power_law_1.2,5.69958381652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,64,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,1,power_law_1.2,7.12273941040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,64,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,64,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,1,power_law_1.2,25.510707092285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,64,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,64,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,64,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,64,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,1,power_law_1.2,11.176953887939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,64,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,64,power_law_1.2,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,64,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,64,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,64,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,64,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,64,power_law_1.2,0.05856000185012818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,64,power_law_1.2,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,64,power_law_1.2,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,1,power_law_1.2,11.792793273925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,64,power_law_1.2,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,64,power_law_1.2,0.10690560340881347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,64,power_law_1.2,0.12615679502487182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,64,power_law_1.2,0.1615872025489807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,1,power_law_1.2,26.516683959960936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,64,power_law_1.2,0.2623487949371338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,64,power_law_1.2,0.3653631925582886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,64,power_law_1.2,0.44994559288024905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,64,power_law_1.2,0.6537216186523438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,1,power_law_1.2,12.281651306152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,64,power_law_1.2,0.9840640068054199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,64,power_law_1.2,1.641472053527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,1,power_law_1.2,12.724838256835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,64,power_law_1.2,2.467020797729492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,1,power_law_1.2,28.896255493164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,1,power_law_1.2,13.155123901367187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,1,power_law_1.2,13.137306213378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,1,power_law_1.2,33.346963500976564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,1,power_law_1.2,13.6880126953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,4,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,4,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,4,balanced,0.09062400460243225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,4,balanced,0.3071733315785726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,4,balanced,0.5782186587651571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,4,balanced,0.7113386789957682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,4,balanced,0.7150932947794596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,4,balanced,0.7145813306172689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,4,balanced,0.7178239822387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,4,balanced,0.7203839619954427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,4,balanced,0.7277226448059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,4,balanced,0.73471999168396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,4,balanced,0.7406933307647705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,4,balanced,0.7500800291697184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,4,balanced,0.764245351155599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,4,balanced,0.7741440137227377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,4,balanced,0.7958186467488607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,1,power_law_1.2,14.034124755859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,4,balanced,0.8435946305592855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,4,balanced,0.8924160003662109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,4,balanced,0.964949369430542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,4,balanced,1.0465280214945476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,4,balanced,1.2439893086751301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,8,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,4,balanced,1.4675626754760742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,8,power_law_1.01,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,8,power_law_1.01,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,4,balanced,1.9135146141052246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,8,power_law_1.01,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,8,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,8,power_law_1.01,0.024966399371623992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,4,balanced,2.42739200592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,8,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,8,power_law_1.01,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,1,power_law_1.2,14.925004577636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,8,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,8,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,8,power_law_1.01,0.0265855997800827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,4,balanced,3.4742612838745117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,8,power_law_1.01,0.028044798970222475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,8,power_law_1.01,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,1,power_law_1.2,40.29480895996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,8,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,8,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,8,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,8,power_law_1.01,0.03806720077991486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,8,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,8,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,8,power_law_1.01,0.07041280269622803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,1,power_law_1.2,14.869708251953124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,8,power_law_1.01,0.08171520233154297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,8,power_law_1.01,0.11161600351333618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,8,power_law_1.01,0.18862080574035645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,4,balanced,4.66209061940511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,8,power_law_1.01,0.28016641139984133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,8,power_law_1.01,0.39342079162597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,8,power_law_1.01,0.7008255958557129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,8,power_law_1.01,0.9295871734619141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,1,power_law_1.2,15.545549011230468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,1,power_law_1.2,16.403660583496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,1,power_law_1.2,45.08323974609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,1,power_law_1.2,16.923429870605467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,1,power_law_1.2,18.021580505371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,1,power_law_1.2,19.39271697998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,1,power_law_1.2,58.544744873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,1,power_law_1.2,21.889433288574217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,1,power_law_1.2,23.14055633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,1,power_law_1.2,57.7101806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,1,power_law_1.2,28.309707641601562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,1,power_law_1.2,33.59416198730469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.6053887844085694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,1,power_law_1.01,1.0483712196350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,1,power_law_1.01,2.0336639404296877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,1,power_law_1.2,43.269735717773436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,1,power_law_1.01,4.07982063293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,1,power_law_1.01,6.179840087890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,1,power_law_1.01,8.002150726318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,1,power_law_1.01,11.431724548339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,1,power_law_1.01,11.930419158935546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,1,power_law_1.2,53.926910400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,1,power_law_1.01,12.661145782470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,1,power_law_1.01,12.944589233398437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,1,power_law_1.01,13.265510559082031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,1,power_law_1.01,13.541786193847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,1,power_law_1.01,13.600358581542968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,1,power_law_1.01,14.214962768554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,1,power_law_1.01,14.72716827392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,1,power_law_1.01,14.706278991699218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,4,8,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,4,8,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,4,8,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,4,8,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,4,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,4,8,power_law_1.2,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,4,8,power_law_1.2,0.03684479892253876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,4,8,power_law_1.2,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,4,8,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,1,power_law_1.01,15.791513061523437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,4,8,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,4,8,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,4,8,power_law_1.2,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,4,8,power_law_1.2,0.04668799936771393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,4,8,power_law_1.2,0.055878400802612305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,4,8,power_law_1.2,0.05978879928588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,4,8,power_law_1.2,0.062463998794555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,4,8,power_law_1.2,0.08680959939956664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,4,8,power_law_1.2,0.1521407961845398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,4,8,power_law_1.2,0.2095103979110718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,4,8,power_law_1.2,0.2637824058532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,4,8,power_law_1.2,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,4,8,power_law_1.2,0.40919041633605957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,1,power_law_1.01,16.875315856933593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,4,8,power_law_1.2,0.505241584777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,1,power_law_1.01,17.079705810546876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,4,8,power_law_1.2,0.9496576309204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,1,power_law_1.01,18.276556396484374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,1,power_law_1.01,19.0385986328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,4,8,power_law_1.2,1.3072064399719239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,1,power_law_1.01,20.99630126953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,1,power_law_1.01,23.629618835449218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,1,power_law_1.01,30.183627319335937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,1,power_law_1.01,29.763583374023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,1,power_law_1.01,38.543768310546874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,1,power_law_1.01,46.862936401367186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,4,8,power_law_1.2,1.8350080490112304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,64,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,64,balanced,0.057855998476346336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,64,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,64,balanced,0.057002668579419456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,64,balanced,0.28654932975769043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,64,balanced,0.5452800194422404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,64,balanced,0.5474986632664999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,64,balanced,0.5493760108947754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,64,balanced,0.5500586827596029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,64,balanced,0.5510826508204142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,64,balanced,0.5533013343811035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,64,balanced,0.5563733180363973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,64,balanced,0.5585920015970866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,64,balanced,0.5614933172861735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,64,balanced,0.5667680104573568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,64,balanced,0.5691733360290527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,64,balanced,0.5763413508733114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,64,balanced,0.5951146682103475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,64,balanced,0.6079146862030029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,64,balanced,0.656544009844462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,64,balanced,0.6876107056935629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,1,balanced,1.5916372934977214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,64,balanced,0.7918933232625326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,64,balanced,0.8198826313018799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,1,balanced,2.823850631713867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,64,balanced,1.106602668762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,2,power_law_1.01,0.34549760818481445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,64,balanced,1.2776106993357341
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,2,power_law_1.01,0.52674560546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,1,balanced,5.726378758748372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,64,balanced,1.721002737681071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,2,power_law_1.01,0.8216575622558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,4,8,power_law_1.2,2.2757375717163084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,2,power_law_1.01,1.194803237915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,64,balanced,2.229248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,2,power_law_1.01,1.5259648323059083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,1,balanced,11.142826080322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,2,power_law_1.01,2.3953407287597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,2,power_law_1.01,2.3662527084350584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,2,power_law_1.01,2.392064094543457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,2,power_law_1.01,2.3955455780029298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,2,power_law_1.01,2.5577472686767577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,1,balanced,21.9069341023763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,2,power_law_1.01,2.555289649963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,2,power_law_1.01,2.573721694946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,2,power_law_1.01,2.7117504119873046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,2,power_law_1.01,2.775859260559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,2,power_law_1.01,2.837504005432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,2,power_law_1.01,2.869638442993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,2,power_law_1.01,2.997862434387207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,1,balanced,32.32494862874349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,2,power_law_1.01,3.196518325805664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,4,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,4,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,4,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,2,power_law_1.01,3.3492992401123045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,4,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,4,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,4,power_law_1.01,0.20131840705871581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,4,power_law_1.01,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,4,power_law_1.01,0.21913599967956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,2,power_law_1.01,3.565951919555664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,4,power_law_1.01,0.23060479164123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,4,power_law_1.01,0.23470079898834229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,4,power_law_1.01,0.23490560054779053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,4,power_law_1.01,0.24944639205932617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,4,power_law_1.01,0.23756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,2,power_law_1.01,3.751731109619141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,4,power_law_1.01,0.2519040107727051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,4,power_law_1.01,0.2537472009658813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,4,power_law_1.01,0.2610879898071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,4,power_law_1.01,0.260096001625061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,4,power_law_1.01,0.27873280048370364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,2,power_law_1.01,4.721868896484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,4,power_law_1.01,0.2799616098403931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,4,power_law_1.01,0.31600639820098875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,4,power_law_1.01,0.349183988571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,4,power_law_1.01,0.43438081741333007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,4,power_law_1.01,0.5378047943115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,1,balanced,32.3788808186849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,2,power_law_1.01,5.021900939941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,4,power_law_1.01,0.8155136108398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,4,power_law_1.01,1.0188799858093263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,4,power_law_1.01,1.500160026550293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,2,power_law_1.01,6.355558395385742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,4,power_law_1.01,1.9347455978393555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,2,power_law_1.01,8.475833892822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,1,balanced,32.45038859049479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,2,power_law_1.01,11.4302978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,2,power_law_1.01,14.507621765136719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,1,balanced,32.50055440266927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,1,balanced,32.54664611816406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,1,balanced,32.6652577718099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,1,balanced,32.77124277750651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,1,balanced,32.90060679117838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,1,balanced,33.08373260498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,1,balanced,33.27061208089193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,128,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,128,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,128,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,128,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,128,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,128,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,128,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,128,power_law_1.2,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,128,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,128,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,128,power_law_1.2,0.05447040200233459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,1,balanced,33.44315846761068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,128,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,128,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,128,power_law_1.2,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,2,power_law_1.2,0.19251199960708618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,128,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,2,power_law_1.2,0.285696005821228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,128,power_law_1.2,0.07167999744415283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,2,power_law_1.2,0.5152768135070801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,128,power_law_1.2,0.08089600205421447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,2,power_law_1.2,0.7116799831390381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,128,power_law_1.2,0.11038719415664673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,128,power_law_1.2,0.14561280012130737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,2,power_law_1.2,0.8859647750854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,128,power_law_1.2,0.25620479583740235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,2,power_law_1.2,1.4403583526611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,128,power_law_1.2,0.35573759078979494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,2,power_law_1.2,1.5093759536743163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,128,power_law_1.2,0.5148672103881836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,2,power_law_1.2,1.6254976272583008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,128,power_law_1.2,0.728268814086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,2,power_law_1.2,1.6429056167602538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,128,power_law_1.2,1.1104255676269532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,2,power_law_1.2,1.6623424530029296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,128,power_law_1.2,1.7936384201049804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,2,power_law_1.2,1.7301504135131835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,2,power_law_1.2,1.7553407669067382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,1,balanced,33.78090159098307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,128,power_law_1.2,2.5311168670654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,2,power_law_1.2,1.740595245361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,2,power_law_1.2,1.8759679794311523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,2,power_law_1.2,1.862246322631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,128,power_law_1.2,3.773235321044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,2,power_law_1.2,1.9580928802490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,2,power_law_1.2,1.9386367797851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,2,power_law_1.2,2.0058111190795898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,2,power_law_1.2,2.101043128967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,2,power_law_1.2,2.2700031280517576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,2,power_law_1.2,2.52805118560791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,2,power_law_1.2,2.9243392944335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,1,balanced,38.63705698649088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,2,power_law_1.2,3.1076351165771485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,2,power_law_1.2,3.9796737670898437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,2,power_law_1.2,4.810137557983398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,1,balanced,35.66967519124349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,2,power_law_1.2,6.546227264404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,1,balanced,42.30331675211588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,1,balanced,35.14384969075521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,1,balanced,37.31097666422526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,1,balanced,39.17772674560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,1,balanced,44.59656778971354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,2,power_law_1.2,7.710514831542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,1,balanced,47.986348470052086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,1,balanced,66.43677775065105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,1,balanced,78.68979390462239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,4,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,4,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,4,power_law_1.01,0.09625599980354309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,4,power_law_1.01,0.18903039693832396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,4,power_law_1.01,0.22261760234832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,4,power_law_1.01,0.30801920890808104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,4,power_law_1.01,0.3299328088760376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,4,power_law_1.01,0.3563391923904419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,4,power_law_1.01,0.35287039279937743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,4,power_law_1.01,0.3616767883300781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,4,power_law_1.01,0.36228480339050295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,4,power_law_1.01,0.3811327934265137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,4,power_law_1.01,0.3772416114807129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,4,power_law_1.01,0.3895296096801758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,4,power_law_1.01,0.4214784145355225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,4,power_law_1.01,0.43335680961608886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,4,power_law_1.01,0.4521984100341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,4,power_law_1.01,0.4808703899383545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,4,power_law_1.01,0.5216256141662597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,4,power_law_1.01,0.6170623779296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,4,power_law_1.01,0.7397312164306641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,4,power_law_1.01,1.0579968452453614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,4,power_law_1.01,1.2283904075622558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,4,power_law_1.01,1.6365568161010742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,4,power_law_1.01,2.31280632019043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,4,power_law_1.01,3.6710273742675783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,4,power_law_1.01,4.698521423339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,8,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,8,power_law_1.2,0.0331712007522583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,8,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,8,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,8,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,8,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,8,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,8,power_law_1.2,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,8,power_law_1.2,0.0741375982761383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,8,power_law_1.2,0.0747327983379364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,8,power_law_1.2,0.08007680177688599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,8,power_law_1.2,0.10465279817581177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,8,power_law_1.2,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,8,power_law_1.2,0.1253376007080078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,128,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,128,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,128,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,128,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,128,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,128,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,128,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,128,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,128,balanced,0.03377600014209747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,128,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,128,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,128,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,128,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,128,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,128,balanced,0.03856533269087473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,128,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,128,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,128,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,128,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,128,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,128,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,128,balanced,0.07918933530648549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,128,balanced,0.17748266458511353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,128,balanced,0.30719467004140216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,8,power_law_1.2,0.17428480386734008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,128,balanced,0.38603198528289795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,128,balanced,0.6101333300272623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,128,balanced,0.8031573295593262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,8,power_law_1.2,0.2258944034576416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,8,power_law_1.2,0.35777280330657957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,128,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,128,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,128,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,128,power_law_1.2,0.038899201154708865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,128,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,8,power_law_1.2,0.5089280128479003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,128,power_law_1.2,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,128,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,128,power_law_1.2,0.04175359904766083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,128,power_law_1.2,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,128,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,128,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,128,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,128,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,128,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,128,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,128,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,128,power_law_1.2,0.09441279768943786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,128,power_law_1.2,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,128,power_law_1.2,0.15319039821624755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,128,power_law_1.2,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,128,power_law_1.2,0.28323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,128,power_law_1.2,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,128,power_law_1.2,0.4900479793548584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,128,power_law_1.2,0.7606272220611572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,128,power_law_1.2,1.0508288383483886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,128,power_law_1.2,1.466982364654541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,8,power_law_1.2,0.7430143833160401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,128,power_law_1.2,2.879283142089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,8,power_law_1.2,1.0500096321105956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,64,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,64,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,64,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,64,power_law_1.01,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,64,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,64,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,64,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,64,power_law_1.01,0.05464320182800293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,64,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,64,power_law_1.01,0.05549439787864685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,64,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,64,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,8,power_law_1.2,1.6457664489746093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,64,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,2,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,64,power_law_1.01,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,2,power_law_1.01,0.1388543963432312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,64,power_law_1.01,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,2,power_law_1.01,0.24204161167144775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,64,power_law_1.01,0.08929280042648316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,2,power_law_1.01,0.38399999141693114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,64,power_law_1.01,0.12305920124053955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,2,power_law_1.01,0.5216256141662597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,64,power_law_1.01,0.18882559537887572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,2,power_law_1.01,0.8067071914672852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,64,power_law_1.01,0.21770238876342773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,2,power_law_1.01,0.7643136024475098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,64,power_law_1.01,0.28487040996551516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,2,power_law_1.01,0.8493056297302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,2,power_law_1.01,0.8345600128173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,64,power_law_1.01,0.3180543899536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,2,power_law_1.01,0.8144895553588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,64,power_law_1.01,0.4376383781433105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,2,power_law_1.01,0.862003231048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,2,power_law_1.01,0.8955904006958008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,64,power_law_1.01,0.5330880165100098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,2,power_law_1.01,0.8880127906799317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,2,power_law_1.01,0.9293696403503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,64,power_law_1.01,0.7782400131225586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,2,power_law_1.01,0.940236759185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,2,power_law_1.01,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,2,power_law_1.01,0.9713664054870605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,64,power_law_1.01,1.0807295799255372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,2,power_law_1.01,1.0016768455505372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,2,power_law_1.01,1.0563584327697755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,2,power_law_1.01,1.1613887786865233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,64,power_law_1.01,1.6717824935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,2,power_law_1.01,1.2437503814697266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,2,power_law_1.01,1.5382143974304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,64,power_law_1.01,2.3005184173583983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,2,power_law_1.01,1.6226303100585937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,2,power_law_1.01,2.0932416915893555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,2,power_law_1.01,2.535219192504883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,2,power_law_1.01,3.625574493408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,2,power_law_1.01,4.471155166625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,32,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,32,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,32,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,32,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,32,balanced,0.2969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,32,balanced,0.560640017191569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,32,balanced,0.8263680140177408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,32,balanced,0.8294400374094645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,32,balanced,0.8306346734364828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,32,balanced,0.8330132961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,32,balanced,0.836949348449707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,32,balanced,0.8424106438954672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,32,balanced,0.8439466953277588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,32,balanced,0.8512852986653646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,32,balanced,0.859989325205485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,32,balanced,0.8663040002187093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,32,balanced,0.8837119738260905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,32,balanced,0.9084586302439371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,32,balanced,0.9374720255533854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,32,balanced,0.9912319978078207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,32,balanced,1.0963626702626545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,32,balanced,1.1856213410695393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,32,balanced,1.2612266540527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,32,balanced,1.460053284962972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,32,balanced,1.7032532691955566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,32,balanced,2.2992213567097983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,32,balanced,2.9755732218424478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,8,power_law_1.2,2.325503921508789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,8,power_law_1.2,3.2313343048095704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,32,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,32,balanced,0.03908266623814901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,32,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,32,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,32,balanced,0.18858667214711508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,32,balanced,0.3546453317006429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,32,balanced,0.3563520113627116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,32,balanced,0.35839998722076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,32,balanced,0.36027733484903973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,32,balanced,0.36061867078145343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,32,balanced,0.36181334654490155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,32,balanced,0.3643733263015747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,32,balanced,0.3652213414510091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,32,balanced,0.36744534969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,32,balanced,0.3710293372472127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,32,balanced,0.3845119873682658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,32,balanced,0.37700267632802326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,32,balanced,0.3891040086746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,32,balanced,0.398848017056783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,32,balanced,0.4020906686782837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,32,balanced,0.4283733367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,32,balanced,0.475818673769633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,32,balanced,0.5056853294372559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,32,balanced,0.5821439822514852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,32,balanced,0.6447786490122477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,32,balanced,0.8425813515981039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,32,balanced,1.0605226357777913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,8,power_law_1.2,4.800921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,2,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,2,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,2,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,2,power_law_1.2,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,2,power_law_1.2,0.1937343955039978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,2,power_law_1.2,0.3790528059005737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,2,power_law_1.2,0.39546880722045896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,2,power_law_1.2,0.43108482360839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,2,power_law_1.2,0.43274240493774413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,2,power_law_1.2,0.4413440227508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,2,power_law_1.2,0.4591616153717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,2,power_law_1.2,0.4767744064331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,2,power_law_1.2,0.4734975814819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,2,power_law_1.2,0.4920959949493408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,2,power_law_1.2,0.49930238723754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,2,power_law_1.2,0.5085184097290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,2,power_law_1.2,0.5277696132659913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,2,power_law_1.2,0.535756778717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,2,power_law_1.2,0.6057919979095459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,2,power_law_1.2,0.6868991851806641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,2,power_law_1.2,0.7284736156463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,2,power_law_1.2,0.9543680191040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,2,power_law_1.2,1.1306879997253418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,2,power_law_1.2,1.486233615875244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,2,power_law_1.2,1.8139135360717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,2,power_law_1.2,2.616320037841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,2,power_law_1.2,3.3535743713378907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,4,balanced,0.03788800040880839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,4,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,4,balanced,0.16827734311421713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,4,balanced,0.3505493402481079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,4,balanced,0.6695253054300944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,4,balanced,1.2965546449025471
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,4,balanced,1.2986026604970295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,4,balanced,1.303381363550822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,4,balanced,1.3057706356048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,4,balanced,1.308672030766805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,4,balanced,1.312597354253133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,4,balanced,1.3177173137664795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,4,balanced,1.323520024617513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,4,balanced,1.332367976506551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,4,balanced,1.3453653653462727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,4,balanced,1.3573120435078938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,4,balanced,1.3730133374532063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,4,balanced,1.443328062693278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,4,balanced,1.4786559740702312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,4,balanced,1.467733383178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,4,balanced,1.5569920539855957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,4,balanced,1.6790186564127605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,4,balanced,1.817087968190511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,4,balanced,2.102442741394043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,4,balanced,2.386943976084391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,4,balanced,3.057663917541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,4,balanced,3.8555307388305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,64,power_law_1.2,0.02229759991168976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,64,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,8,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,8,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,8,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,8,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,8,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,8,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,8,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,8,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,8,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,8,balanced,0.04130133241415024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,8,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,8,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,8,balanced,0.04350399971008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,8,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,8,balanced,0.04828266799449921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,8,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,8,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,8,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,8,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,64,power_law_1.2,0.021913599967956544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,8,balanced,0.08123733103275299
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,8,balanced,0.09267200032869975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,64,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,8,balanced,0.16366933782895407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,64,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,64,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,8,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,64,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,8,balanced,0.37853864828745526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,64,power_law_1.2,0.023520000278949738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,64,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,8,balanced,0.4983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,64,power_law_1.2,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,64,power_law_1.2,0.02455040067434311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,8,balanced,0.7785813013712565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,64,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,64,power_law_1.2,0.025190401077270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,64,power_law_1.2,0.026188799738883974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,8,balanced,1.1303253173828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,64,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,64,power_law_1.2,0.02887679934501648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,64,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,64,power_law_1.2,0.03828479945659637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,64,power_law_1.2,0.04565759897232056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,64,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,64,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,64,power_law_1.2,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,64,power_law_1.2,0.11816960573196411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,64,power_law_1.2,0.2732032060623169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,64,power_law_1.2,0.33361918926239015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,1,power_law_1.2,0.6094848155975342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,1,power_law_1.2,1.0999808311462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,1,power_law_1.2,2.0398080825805662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,1,power_law_1.2,3.246694564819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,1,power_law_1.2,4.372275161743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,64,power_law_1.2,0.5396480083465576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,1,power_law_1.2,8.100863647460937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,1,power_law_1.2,8.487935638427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,1,power_law_1.2,9.070387268066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,1,power_law_1.2,9.375129699707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,1,power_law_1.2,9.743360137939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,1,power_law_1.2,10.116710662841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,1,power_law_1.2,10.051789093017579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,1,power_law_1.2,10.343424224853516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,1,power_law_1.2,10.665574645996093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,1,power_law_1.2,10.864844512939452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,4,power_law_1.01,0.5754879951477051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,4,power_law_1.01,0.9699328422546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,4,power_law_1.01,1.1696127891540526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,1,power_law_1.2,10.890854644775391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,4,power_law_1.01,1.3832192420959473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,4,power_law_1.01,1.7305536270141602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,4,power_law_1.01,2.226585578918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,4,power_law_1.01,2.2063104629516603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,1,power_law_1.2,11.153817749023437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,4,power_law_1.01,2.348031997680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,4,power_law_1.01,2.4465408325195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,4,power_law_1.01,2.5573375701904295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,4,power_law_1.01,2.5939968109130858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,1,power_law_1.2,11.667046356201173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,4,power_law_1.01,2.4995840072631834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,4,power_law_1.01,2.6187776565551757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,4,power_law_1.01,2.5862144470214843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,1,power_law_1.2,12.034867095947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,4,power_law_1.01,2.6411008834838867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,4,power_law_1.01,2.7396095275878904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,4,power_law_1.01,2.7846656799316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,4,power_law_1.01,2.937651252746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,1,power_law_1.2,12.848538208007813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,4,power_law_1.01,3.063193511962891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,4,power_law_1.01,3.3880062103271484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,4,power_law_1.01,3.6470783233642576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,1,power_law_1.2,14.031666564941407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,4,power_law_1.01,4.550233459472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,4,power_law_1.01,5.180819320678711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,4,power_law_1.01,7.283097839355468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,1,power_law_1.2,16.793600463867186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,4,power_law_1.01,8.241766357421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,1,power_law_1.2,18.633319091796874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,4,power_law_1.01,12.333055877685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,4,power_law_1.01,14.855577087402343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,1,power_law_1.2,24.132199096679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,64,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,64,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,64,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,64,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,64,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,64,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,64,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,64,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,64,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,64,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,64,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,64,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,64,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,64,balanced,0.04009066770474116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,64,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,64,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,64,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,64,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,64,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,64,balanced,0.06400000055631001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,64,balanced,0.0727040022611618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,64,balanced,0.0936959981918335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,64,balanced,0.10990933577219646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,64,balanced,0.2529279987017314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,64,balanced,0.3418453137079875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,64,balanced,0.5031253496805826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,64,balanced,0.680618683497111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,1,power_law_1.2,28.90772399902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,64,power_law_1.2,0.6973440170288085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,1,power_law_1.2,38.8790283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,64,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,64,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,64,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,64,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,64,balanced,0.048298666874567665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,64,balanced,0.05085866649945577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,64,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,64,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,64,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,64,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,64,balanced,0.05341866612434387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,64,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,64,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,64,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,64,balanced,0.060415998101234436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,64,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,64,balanced,0.06621333460013072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,64,balanced,0.0730453332265218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,64,balanced,0.08021333316961925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,64,balanced,0.15359999736150107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,64,balanced,0.2435413400332133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,64,balanced,0.3259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,64,balanced,0.3979946772257487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,64,balanced,0.5719039837519327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,64,balanced,0.7459839979807535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,64,balanced,1.1168426672617595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,64,balanced,1.4848000208536785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,1,power_law_1.2,48.27607116699219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,1,8,power_law_1.01,0.03234559893608093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,1,8,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,1,8,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,64,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,64,power_law_1.01,0.024537600576877594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,64,power_law_1.01,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,64,power_law_1.01,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,1,8,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,64,power_law_1.01,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,1,8,power_law_1.01,0.02968960106372833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,1,8,power_law_1.01,0.03375999927520752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,1,8,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,64,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,1,8,power_law_1.01,0.03519999980926514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,64,power_law_1.01,0.026182401180267333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,1,8,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,64,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,1,8,power_law_1.01,0.03560320138931274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,64,power_law_1.01,0.026822400093078614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,1,8,power_law_1.01,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,64,power_law_1.01,0.02723200023174286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,1,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,64,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,1,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,64,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,1,8,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,64,power_law_1.01,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,1,8,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,64,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,1,8,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,64,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,1,8,power_law_1.01,0.06695680022239685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,64,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,1,8,power_law_1.01,0.07905279994010925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,64,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,1,8,power_law_1.01,0.10216959714889526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,64,power_law_1.01,0.07021440267562866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,1,8,power_law_1.01,0.1505280017852783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,64,power_law_1.01,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,1,8,power_law_1.01,0.20295679569244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,64,power_law_1.01,0.1361791968345642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,1,8,power_law_1.01,0.2648063898086548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,64,power_law_1.01,0.27504639625549315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,1,8,power_law_1.01,0.3338239908218384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,64,power_law_1.01,0.34628479480743407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,1,8,power_law_1.01,0.5007359981536865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,64,power_law_1.01,0.5081088066101074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,1,8,power_law_1.01,0.6459392070770263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,64,power_law_1.01,0.7120575904846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,1,8,power_law_1.01,1.024409580230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,1,8,power_law_1.01,1.3451007843017577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,64,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,64,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,64,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,64,balanced,0.032069332897663116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,64,balanced,0.03293866664171219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,64,balanced,0.03393599887688955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,64,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,64,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,64,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,64,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,64,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,64,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,64,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,64,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,64,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,64,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,64,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,64,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,64,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,64,balanced,0.09657067060470581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,64,balanced,0.09045333663622539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,64,balanced,0.19336533546447754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,64,balanced,0.2218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,64,balanced,0.311296006043752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,64,balanced,0.35020800431569415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,64,balanced,0.5562026500701904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,64,balanced,0.694271961847941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,32,power_law_1.01,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,32,power_law_1.01,0.050374400615692136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,32,power_law_1.01,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,32,power_law_1.01,0.049958398938179015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,32,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,32,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,32,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,32,power_law_1.01,0.05303679704666138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,32,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,32,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,32,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,32,power_law_1.01,0.06451200246810913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,32,power_law_1.01,0.06615039706230164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,32,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,32,power_law_1.01,0.07434239983558655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,32,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,32,power_law_1.01,0.08642560243606567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,32,power_law_1.01,0.09768959879875183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,32,power_law_1.01,0.12677119970321654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,32,power_law_1.01,0.1708032011985779
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,32,power_law_1.01,0.24637439250946044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,32,power_law_1.01,0.3586047887802124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,32,power_law_1.01,0.46837759017944336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,32,power_law_1.01,0.8316927909851074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,32,power_law_1.01,1.0045439720153808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,32,power_law_1.01,1.746944046020508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,32,power_law_1.01,2.291302490234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,128,power_law_1.01,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,128,power_law_1.01,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,128,power_law_1.01,0.28487679958343504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,128,power_law_1.01,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,128,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,128,power_law_1.01,0.2902015924453735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,128,power_law_1.01,0.2916352033615112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,128,power_law_1.01,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,128,power_law_1.01,0.29409279823303225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,128,power_law_1.01,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,128,power_law_1.01,0.29675519466400146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,128,power_law_1.01,0.3026943922042847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,128,power_law_1.01,0.3037184000015259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,128,power_law_1.01,0.3071808099746704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,128,power_law_1.01,0.3086335897445679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,128,power_law_1.01,0.3250175952911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,128,power_law_1.01,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,128,power_law_1.01,0.3858432054519653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,128,power_law_1.01,0.42352638244628904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,128,power_law_1.01,0.5902336120605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,128,power_law_1.01,0.6782976150512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,128,power_law_1.01,1.003110408782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,128,power_law_1.01,1.3066240310668946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,128,power_law_1.01,1.8106367111206054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,16,16,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,16,16,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,16,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,16,16,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,16,16,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,128,power_law_1.01,2.4311807632446287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,16,16,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,16,16,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,16,16,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,16,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,16,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,16,16,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,16,16,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,16,16,balanced,0.036501333117485046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,16,16,balanced,0.03736000011364619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,16,16,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,16,16,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,16,16,balanced,0.043663998444875084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,16,16,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,16,16,balanced,0.049141332507133484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,16,16,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,16,16,balanced,0.06621866424878438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,16,16,balanced,0.08994133273760478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,128,power_law_1.01,4.4130302429199215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,16,16,balanced,0.17339734236399332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,16,16,balanced,0.3068586587905884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,128,power_law_1.01,5.636710357666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,16,16,balanced,0.36744534969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,16,16,balanced,0.5889706611633301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,16,16,balanced,0.7825067043304443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,2,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,2,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,2,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,2,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,2,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,2,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,2,power_law_1.2,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,2,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,2,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,2,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,2,power_law_1.2,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,2,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,2,power_law_1.2,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,2,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,2,power_law_1.2,0.09523199796676636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,2,power_law_1.2,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,2,power_law_1.2,0.13741439580917358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,2,power_law_1.2,0.22466559410095216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,2,power_law_1.2,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,2,power_law_1.2,0.39996159076690674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,2,power_law_1.2,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,2,power_law_1.01,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,2,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,2,power_law_1.01,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,2,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,2,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,2,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,2,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,2,power_law_1.01,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,2,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,2,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,2,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,2,power_law_1.01,0.06410239934921265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,2,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,2,power_law_1.01,0.08089600205421447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,2,power_law_1.01,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,2,power_law_1.01,0.104038405418396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,2,power_law_1.01,0.13496320247650145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,2,power_law_1.01,0.21483519077301025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,2,power_law_1.01,0.24431359767913818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,2,power_law_1.2,0.5916672229766846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,2,power_law_1.01,0.3463167905807495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,2,power_law_1.01,0.4632575988769531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,2,power_law_1.01,0.7956480026245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,2,power_law_1.01,0.8282112121582031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,2,power_law_1.01,1.3420543670654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,2,power_law_1.2,0.9533439636230469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,2,power_law_1.01,1.9924991607666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,2,power_law_1.2,1.39999361038208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,2,power_law_1.01,3.2681983947753905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,1,balanced,0.06705600023269653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,1,balanced,0.29201066493988037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,1,balanced,0.5307733217875162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,1,balanced,1.0241706371307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,1,balanced,2.039466698964437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,1,balanced,3.9582719802856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,1,balanced,3.97926394144694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,1,balanced,3.990858713785807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,1,balanced,4.010837237040202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,1,balanced,4.023807843526204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,1,balanced,4.052138646443685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,2,balanced,0.02611200014750163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,2,balanced,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,2,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,2,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,2,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,2,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,2,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,2,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,2,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,2,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,1,balanced,4.081653277079265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,2,balanced,0.02849599967400233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,2,balanced,0.030373332401116688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,2,balanced,0.031210665901501972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,2,balanced,0.03156266609827677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,2,balanced,0.03990400085846583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,2,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,2,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,2,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,2,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,2,balanced,0.09779199957847595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,1,balanced,4.106752077738444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,2,balanced,0.1181013286113739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,2,balanced,0.2474666635195414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,2,balanced,0.32255999247233075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,2,balanced,0.4776959816614787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,1,balanced,4.156415939331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,2,balanced,0.6563839912414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,2,balanced,1.0697387059529622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,1,balanced,4.21068795522054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,2,balanced,1.4789973894755046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,1,balanced,4.25930118560791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,1,balanced,4.352853457132976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,1,balanced,4.525568008422852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,1,balanced,4.706645329793294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,1,balanced,5.073237419128418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,1,balanced,5.465429306030273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,1,balanced,6.383103688557942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,1,balanced,6.904629389444987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,1,balanced,8.377344131469727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,1,power_law_1.2,0.24861440658569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,1,balanced,9.793365478515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,1,power_law_1.2,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,1,power_law_1.2,0.7327744007110596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,1,power_law_1.2,1.1610112190246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,1,power_law_1.2,1.6121856689453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,1,balanced,13.253461201985678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,1,power_law_1.2,2.928396797180176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,1,power_law_1.2,3.2026622772216795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,1,power_law_1.2,3.3325054168701174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,2,power_law_1.2,2.007040023803711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,1,balanced,16.612164815266926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,1,power_law_1.2,3.4711551666259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,1,power_law_1.2,3.5297279357910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,1,power_law_1.2,3.7365760803222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,1,power_law_1.2,3.7984256744384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,1,power_law_1.2,3.867443084716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,2,power_law_1.01,4.242841720581055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,1,power_law_1.2,4.099276733398438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,1,power_law_1.2,4.2215423583984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,1,power_law_1.2,4.306943893432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,1,power_law_1.2,4.468121719360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,1,power_law_1.2,4.860108947753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,1,power_law_1.2,5.2066303253173825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,1,power_law_1.2,5.917491149902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,1,power_law_1.2,6.5511421203613285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,1,power_law_1.2,7.985343933105469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,1,power_law_1.2,9.139199829101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,1,power_law_1.2,11.802009582519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,1,power_law_1.2,14.076518249511718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,1,power_law_1.2,19.786341857910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,2,power_law_1.2,3.0345216751098634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,1,power_law_1.2,25.026765441894533
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,128,power_law_1.2,0.2545664072036743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,128,power_law_1.2,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,128,power_law_1.2,0.2283519983291626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,128,power_law_1.2,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,128,power_law_1.2,0.1955839991569519
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,128,power_law_1.2,0.09830399751663207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,128,power_law_1.2,0.10485759973526002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,128,power_law_1.2,0.23613440990447998
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,128,power_law_1.2,0.23654398918151856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,128,power_law_1.2,0.2070528030395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,128,power_law_1.2,0.24186880588531495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,128,power_law_1.2,0.2174976110458374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,128,power_law_1.2,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,128,power_law_1.2,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,128,power_law_1.2,0.24206080436706542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,128,power_law_1.2,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,128,power_law_1.2,0.26664960384368896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,128,power_law_1.2,0.3043328046798706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,128,power_law_1.2,0.35143680572509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,128,power_law_1.2,0.4388864040374756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,128,power_law_1.2,0.5142528057098389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,128,power_law_1.2,0.7948287963867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,128,power_law_1.2,1.0510335922241212
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,128,power_law_1.2,1.6578559875488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,128,power_law_1.2,1.9544063568115235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,128,power_law_1.2,2.9038591384887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,128,power_law_1.2,5.165875244140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,4,power_law_1.01,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,4,power_law_1.01,0.06388480067253113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,4,power_law_1.01,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,2,power_law_1.2,4.641996765136719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,4,power_law_1.01,0.07659519910812378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,4,power_law_1.01,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,4,power_law_1.01,0.1615872025489807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,4,power_law_1.01,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,4,power_law_1.01,0.24125440120697023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,4,power_law_1.01,0.24388480186462402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,4,power_law_1.01,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,4,power_law_1.01,0.23511040210723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,4,power_law_1.01,0.24821760654449462
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,4,power_law_1.01,0.2707456111907959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,4,power_law_1.01,0.26499199867248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,4,power_law_1.01,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,4,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,4,power_law_1.01,0.32624640464782717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,4,power_law_1.01,0.35246078968048095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,4,power_law_1.01,0.40222721099853515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,4,power_law_1.01,0.5230591773986817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,4,power_law_1.01,0.7030655860900878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,4,power_law_1.01,1.1069439888000487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,4,power_law_1.01,1.4483455657958983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,4,power_law_1.01,2.023423957824707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,4,power_law_1.01,2.699654388427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,4,power_law_1.01,4.0052734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,4,power_law_1.01,5.429452896118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,16,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,16,power_law_1.01,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,16,power_law_1.01,0.41553921699523927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,16,power_law_1.01,0.40468478202819824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,16,power_law_1.01,0.41635842323303224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,16,power_law_1.01,0.4272128105163574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,16,power_law_1.01,0.36126720905303955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,16,power_law_1.01,0.3637248039245605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,16,power_law_1.01,0.33955841064453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,16,power_law_1.01,0.38010880947113035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,16,power_law_1.01,0.3694591999053955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,16,power_law_1.01,0.39792640209198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,16,power_law_1.01,0.3772416114807129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,16,power_law_1.01,0.40038399696350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,16,power_law_1.01,0.39791359901428225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,16,power_law_1.01,0.4312960147857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,16,power_law_1.01,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,16,power_law_1.01,0.4823040008544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,16,power_law_1.01,0.5134335994720459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,16,power_law_1.01,0.571392011642456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,16,power_law_1.01,0.6158336162567138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,16,power_law_1.01,0.7624576091766357
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,16,power_law_1.01,0.9011136054992676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,16,power_law_1.01,1.1808768272399903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,16,power_law_1.01,1.6242687225341796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,16,power_law_1.01,2.271232032775879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,16,power_law_1.01,3.161497688293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,64,power_law_1.01,0.3184639930725098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,64,power_law_1.01,0.29040639400482177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,64,power_law_1.01,0.2899967908859253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,64,power_law_1.01,0.28424320220947263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,64,power_law_1.01,0.2308095932006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,64,power_law_1.01,0.2809664011001587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,64,power_law_1.01,0.28180480003356934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,64,power_law_1.01,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,64,power_law_1.01,0.2977792024612427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,64,power_law_1.01,0.27791359424591067
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,64,power_law_1.01,0.2799616098403931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,64,power_law_1.01,0.2924544095993042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,64,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,64,power_law_1.01,0.3010560035705566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,64,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,64,power_law_1.01,0.31088640689849856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,64,power_law_1.01,0.30760960578918456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,64,power_law_1.01,0.33402879238128663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,64,power_law_1.01,0.3739583969116211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,64,power_law_1.01,0.39301118850708006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,64,power_law_1.01,0.47800321578979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,64,power_law_1.01,0.633241605758667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,64,power_law_1.01,0.8103936195373536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,64,power_law_1.01,1.1497471809387207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,64,power_law_1.01,1.3918208122253417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,64,power_law_1.01,2.219385528564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,64,power_law_1.01,3.059481620788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,32,balanced,0.07167999943097432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,32,balanced,0.06946133573849995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,32,balanced,0.06331733365853627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,32,balanced,0.30873600641886395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,32,balanced,0.5925546487172445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,32,balanced,0.7297706604003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,32,balanced,0.7304373582204183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,32,balanced,0.7278933525085449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,32,balanced,0.7287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,32,balanced,0.7289173603057861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,32,balanced,0.7323306401570638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,32,balanced,0.7354026635487875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,32,balanced,0.7381333510080973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,32,balanced,0.7425706386566162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,32,balanced,0.7475199699401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,32,balanced,0.7577599684397379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,32,balanced,0.7666347026824951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,32,balanced,0.8956586519877116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,32,balanced,0.8106666405995687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,32,balanced,0.9468586444854736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,32,balanced,0.9741653601328532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,32,balanced,1.1828906536102295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,32,balanced,1.1040266354878743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,32,balanced,1.4620960553487141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,32,balanced,1.5018666585286458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,32,balanced,2.246826648712158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,32,balanced,2.9844481150309243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,4,balanced,0.037205333511034645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,4,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,4,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,4,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,4,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,4,balanced,0.18773333231608072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,4,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,4,balanced,0.19131733973821005
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,4,balanced,0.1925119956334432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,4,balanced,0.19316800435384116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,4,balanced,0.19404800732930502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,4,balanced,0.19675199190775552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,4,balanced,0.19831466674804688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,4,balanced,0.20358399550120035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,4,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,4,balanced,0.21248000860214233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,4,balanced,0.222378671169281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,4,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,4,balanced,0.2619733413060506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,4,balanced,0.29796799023946124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,4,balanced,0.36881065368652344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,4,balanced,0.4036266803741455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,4,balanced,0.4875946839650472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,4,balanced,0.7734613418579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,4,balanced,1.0707626342773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,4,balanced,1.6334506670633953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,4,balanced,2.189823945363363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,8,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,8,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,8,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,8,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,8,balanced,0.5367466608683268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,8,balanced,1.0504533449808757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,8,balanced,1.0547200043996174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,8,balanced,1.0403839747111003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,8,balanced,1.0453333059946697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,8,balanced,1.0478933652242024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,8,balanced,1.0533546606699626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,8,balanced,1.087488015492757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,8,balanced,1.062058687210083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,8,balanced,1.0712746779123943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,8,balanced,1.0825386842091878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,8,balanced,1.0926079750061035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,8,balanced,1.1136000156402588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,8,balanced,1.1622400283813477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,8,balanced,1.1973973115285237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,8,balanced,1.2718079884847004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,8,balanced,1.3552640279134114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,8,balanced,1.5170559883117676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,8,balanced,1.6469333966573079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,8,balanced,2.005674680074056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,8,balanced,2.422272046407064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,8,balanced,3.174912134806315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,8,balanced,3.9710718790690103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,4,power_law_1.2,1.1333632469177246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,4,power_law_1.2,1.6029695510864257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,4,power_law_1.2,2.2151168823242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,4,power_law_1.2,2.7197439193725588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,4,power_law_1.2,3.1899648666381837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,4,power_law_1.2,4.776140975952148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,4,power_law_1.2,4.786790466308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,4,power_law_1.2,4.852121734619141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,4,power_law_1.2,4.922163009643555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,4,power_law_1.2,4.802969741821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,4,power_law_1.2,4.823244857788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,4,power_law_1.2,5.218304061889649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,16,power_law_1.01,0.23653120994567872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,16,power_law_1.01,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,4,power_law_1.2,5.309011077880859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,16,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,16,power_law_1.01,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,16,power_law_1.01,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,4,power_law_1.2,5.600665664672851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,16,power_law_1.01,0.2756608009338379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,16,power_law_1.01,0.27832319736480715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,16,power_law_1.01,0.2766848087310791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,4,power_law_1.2,5.804646301269531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,16,power_law_1.01,0.2664448022842407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,1,balanced,0.3834880193074544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,16,power_law_1.01,0.2689023971557617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,1,balanced,0.6678187052408854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,4,power_law_1.2,5.681151962280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,16,power_law_1.01,0.2736128091812134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,1,balanced,1.3011626402537029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,16,power_law_1.01,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,1,balanced,2.559658686319987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,16,power_law_1.01,0.2836479902267456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,16,power_law_1.01,0.28549120426177976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,16,power_law_1.01,0.3008255958557129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,4,power_law_1.2,5.8796031951904295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,1,balanced,5.0744320551554365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,16,power_law_1.01,0.30453760623931886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,16,power_law_1.01,0.32665600776672366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,16,power_law_1.01,0.33136639595031736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,16,power_law_1.01,0.392192006111145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,4,power_law_1.2,6.289408111572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,16,power_law_1.01,0.42678399085998536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,1,balanced,10.105514526367188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,16,power_law_1.01,0.5230591773986817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,16,power_law_1.01,0.7053311824798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,4,power_law_1.2,6.631629180908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,16,power_law_1.01,0.8574975967407227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,1,balanced,10.12053362528483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,16,power_law_1.01,1.2935168266296386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,4,power_law_1.2,7.3353218078613285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,1,balanced,10.13811175028483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,16,power_law_1.01,1.8876415252685548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,4,power_law_1.2,8.122163391113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,16,power_law_1.01,2.646835136413574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,1,balanced,10.157056172688803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,16,power_law_1.01,3.2501758575439452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,1,balanced,10.172245025634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,4,power_law_1.2,10.193920135498047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,1,balanced,10.200063705444336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,4,power_law_1.2,10.660249328613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,1,balanced,10.232490539550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,1,balanced,10.257919947306315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,1,balanced,10.315776189168295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,1,balanced,10.371920267740885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,1,balanced,10.424661636352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,4,power_law_1.2,14.227456665039062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,1,balanced,10.526543935139975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,1,balanced,11.070293426513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,1,balanced,11.263999938964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,4,power_law_1.2,15.98382110595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,1,balanced,11.698346455891928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,1,balanced,12.262730916341146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,1,balanced,12.571647644042969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,1,balanced,12.422655741373697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,4,power_law_1.2,24.69416961669922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,1,balanced,13.551104227701822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,1,balanced,14.943061828613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,1,balanced,17.908735911051433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,1,balanced,22.892201741536457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,4,power_law_1.2,31.34422912597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,8,power_law_1.01,0.43376641273498534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,8,power_law_1.01,0.7563263893127441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,8,power_law_1.01,0.6377088069915772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,8,power_law_1.01,0.7946239948272705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,8,power_law_1.01,1.0065919876098632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,8,power_law_1.01,0.9719807624816894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,8,power_law_1.01,0.9758720397949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,8,power_law_1.01,0.9979904174804688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,8,power_law_1.01,0.9656255722045899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,8,power_law_1.01,0.9422847747802734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,8,power_law_1.01,0.9574399948120117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,8,power_law_1.01,0.9746432304382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,8,power_law_1.01,1.033625602722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,8,power_law_1.01,1.0512255668640136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,8,power_law_1.01,1.043660831451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,8,power_law_1.01,1.0493951797485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,8,power_law_1.01,1.1063296318054199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,8,power_law_1.01,1.1851776123046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,8,power_law_1.01,1.2378111839294434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,8,power_law_1.01,1.4376959800720215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,8,power_law_1.01,1.6146432876586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,8,power_law_1.01,2.0389888763427733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,8,power_law_1.01,2.186444854736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,8,power_law_1.01,2.9493247985839846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,8,power_law_1.01,3.5831680297851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,8,power_law_1.01,4.827135848999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,8,power_law_1.01,6.377062225341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,1,power_law_1.2,0.193503999710083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,1,power_law_1.2,0.3659775972366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,1,power_law_1.2,0.6924287796020507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,1,power_law_1.2,1.124556827545166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,1,power_law_1.2,1.5714303970336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,1,power_law_1.2,2.7672576904296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,1,power_law_1.2,3.010969543457031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,1,power_law_1.2,3.1133695602416993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,2,power_law_1.01,1.475379180908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,1,power_law_1.2,3.24218864440918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,2,power_law_1.01,2.877440071105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,1,power_law_1.2,3.3484798431396485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,2,power_law_1.01,3.686809539794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,1,power_law_1.2,3.5448577880859373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,1,power_law_1.2,3.6050945281982423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,2,power_law_1.01,5.949235153198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,1,power_law_1.2,3.6689918518066404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,1,power_law_1.2,3.7529407501220704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,2,power_law_1.01,8.343142700195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,1,power_law_1.2,3.7437183380126955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,1,power_law_1.2,3.7449726104736327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,1,power_law_1.2,3.7715648651123046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,2,power_law_1.01,12.68652801513672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,1,power_law_1.2,3.969004821777344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,1,power_law_1.2,4.1072639465332035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,1,power_law_1.2,4.365926361083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,2,power_law_1.01,12.935781860351563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,1,power_law_1.2,4.800921630859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,1,power_law_1.2,5.5408576965332035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,2,power_law_1.01,13.450035095214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,1,power_law_1.2,5.827993774414063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,1,power_law_1.2,7.156940460205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,2,power_law_1.01,14.007296752929687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,2,power_law_1.01,14.511923217773438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,1,power_law_1.2,8.107212829589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,1,power_law_1.2,10.756505584716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,2,power_law_1.01,14.404812622070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,2,power_law_1.01,14.85455322265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,1,power_law_1.2,13.468057250976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,2,power_law_1.01,14.608998107910157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,2,power_law_1.01,15.335833740234374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,2,power_law_1.01,16.345497131347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,2,power_law_1.01,16.265011596679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,2,power_law_1.01,17.16899871826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,2,power_law_1.01,17.500979614257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,2,power_law_1.01,18.136679077148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,2,power_law_1.01,19.100057983398436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,2,power_law_1.01,19.349913024902342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,2,128,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,2,128,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,2,128,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,2,128,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,2,128,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,2,128,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,2,128,balanced,0.051370665431022644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,2,128,balanced,0.05205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,2,128,balanced,0.05253333350022634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,2,128,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,2,128,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,2,128,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,2,128,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,2,128,balanced,0.060415998101234436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,2,128,balanced,0.06178133189678192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,2,128,balanced,0.06568000217278798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,2,128,balanced,0.0727040022611618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,2,128,balanced,0.08004266520341237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,2,128,balanced,0.1295360028743744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,2,128,balanced,0.237226665019989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,2,128,balanced,0.32255999247233075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,2,128,balanced,0.4015786647796631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,2,128,balanced,0.5613226493199667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,2,128,balanced,0.7231146494547526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,2,128,balanced,1.0804906686147053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,2,power_law_1.01,22.554623413085938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,2,128,balanced,1.4385387102762859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,2,power_law_1.01,23.012147521972658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,2,power_law_1.01,28.297012329101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,2,power_law_1.01,33.27262573242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,2,power_law_1.01,44.81535949707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,4,power_law_1.01,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,4,power_law_1.01,0.6758399963378906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,4,power_law_1.01,0.8560640335083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,4,power_law_1.01,1.245798397064209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,4,power_law_1.01,1.4135295867919921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,4,power_law_1.01,1.5708160400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,4,power_law_1.01,2.2745088577270507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,4,power_law_1.01,2.0797439575195313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,4,power_law_1.01,2.068070411682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,4,power_law_1.01,2.0590591430664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,2,power_law_1.01,51.02694396972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,4,power_law_1.01,2.3162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,4,power_law_1.01,2.293350410461426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,4,power_law_1.01,2.252595138549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,4,power_law_1.01,2.343935966491699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,4,power_law_1.01,2.2784000396728517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,4,power_law_1.01,2.4657920837402343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,4,power_law_1.01,2.4879104614257814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,4,power_law_1.01,2.669561576843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,4,power_law_1.01,2.554265594482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,4,power_law_1.01,2.7650047302246095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,4,power_law_1.01,2.997043228149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,4,power_law_1.01,3.5981311798095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,4,power_law_1.01,3.7335041046142576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,4,power_law_1.01,4.486342239379883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,4,power_law_1.01,5.195775985717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,4,power_law_1.01,7.137484741210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,4,power_law_1.01,8.792269134521485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,2,1,power_law_1.01,0.28628480434417725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,2,1,power_law_1.01,0.454860782623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,2,1,power_law_1.01,0.578764820098877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,2,1,power_law_1.01,0.9482239723205567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,2,1,power_law_1.01,1.0024959564208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,2,1,power_law_1.01,0.9848832130432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,2,1,power_law_1.01,1.04202241897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,2,1,power_law_1.01,1.0491904258728026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,2,1,power_law_1.01,1.0690560340881348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,2,1,power_law_1.01,1.0721280097961425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,2,1,power_law_1.01,1.0894975662231445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,2,1,power_law_1.01,1.105504035949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,2,1,power_law_1.01,1.1294719696044921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,2,1,power_law_1.01,1.1665408134460449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,2,1,power_law_1.01,1.224499225616455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,2,1,power_law_1.01,1.3142016410827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,2,1,power_law_1.01,1.3240320205688476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,2,1,power_law_1.01,1.6281408309936523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,2,1,power_law_1.01,1.807155227661133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,2,1,power_law_1.01,2.37772159576416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,2,1,power_law_1.01,2.8282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,2,1,power_law_1.01,3.8338558197021486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,16,power_law_1.01,0.37867519855499265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,16,power_law_1.01,0.6774784088134765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,16,power_law_1.01,0.6737919807434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,16,power_law_1.01,0.6584320068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,16,power_law_1.01,0.637337589263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,16,power_law_1.01,0.5535744190216064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,16,power_law_1.01,0.638976001739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,16,power_law_1.01,0.5871615886688233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,16,power_law_1.01,0.5971968173980713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,16,power_law_1.01,0.6027135848999023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,16,power_law_1.01,0.6205440044403077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,16,power_law_1.01,0.6410240173339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,16,power_law_1.01,0.6021120071411132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,2,1,power_law_1.01,4.8560127258300785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,16,power_law_1.01,0.6289408206939697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,16,power_law_1.01,0.6127615928649902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,16,power_law_1.01,0.6653952121734619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,16,power_law_1.01,0.6721536159515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,16,power_law_1.01,0.7045119762420654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,16,power_law_1.01,0.7548927783966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,16,power_law_1.01,0.8263680458068847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,16,power_law_1.01,0.8843263626098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,16,power_law_1.01,1.0803199768066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,16,power_law_1.01,1.2472319602966309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,16,power_law_1.01,1.5325183868408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,16,power_law_1.01,1.94150390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,16,power_law_1.01,2.5393152236938477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,16,power_law_1.01,3.3353729248046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,2,1,power_law_1.01,6.817791748046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,2,1,power_law_1.01,9.014681243896485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,32,power_law_1.2,0.6150144100189209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,32,power_law_1.2,0.5492671966552735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,32,power_law_1.2,0.551526403427124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,32,power_law_1.2,0.5640192031860352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,32,power_law_1.2,0.5070847988128662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,32,power_law_1.2,0.5326848030090332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,32,power_law_1.2,0.5289984226226807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,32,power_law_1.2,0.504422378540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,32,power_law_1.2,0.5119999885559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,32,power_law_1.2,0.5134335994720459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,32,power_law_1.2,0.5480447769165039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,32,power_law_1.2,0.5124095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,32,power_law_1.2,0.5294079780578613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,32,power_law_1.2,0.5289984226226807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,32,power_law_1.2,0.5443583965301514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,32,power_law_1.2,0.5810175895690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,32,power_law_1.2,0.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,32,power_law_1.2,0.66211838722229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,32,power_law_1.2,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,32,power_law_1.2,0.8560640335083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,32,power_law_1.2,1.023795223236084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,32,power_law_1.2,1.3942784309387206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,32,power_law_1.2,1.6549888610839845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,32,power_law_1.2,2.6093568801879883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,32,power_law_1.2,2.9415424346923826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,32,power_law_1.2,4.413235092163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,32,4,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,32,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,32,4,balanced,0.05494933327039083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,32,4,balanced,0.059903999169667564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,32,4,balanced,0.08055466910203297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,32,4,balanced,0.27460267146428424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,32,4,balanced,0.40294400850931805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,32,4,balanced,0.4060159921646118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,32,4,balanced,0.406330664952596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,32,4,balanced,0.4107786814371745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,32,4,balanced,0.4135253429412842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,32,4,balanced,0.4184746742248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,32,4,balanced,0.4220586617787679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,32,4,balanced,0.43008001645406085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,32,4,balanced,0.44115201632181805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,32,4,balanced,0.4493653376897176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,32,4,balanced,0.46882132689158124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,32,power_law_1.2,5.568921661376953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,32,4,balanced,0.507370670636495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,32,4,balanced,0.5686613321304321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,32,4,balanced,0.6640640099843343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,32,4,balanced,0.7838719685872396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,32,4,balanced,1.0977280139923096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,32,4,balanced,1.3798400561014812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,32,4,balanced,2.0094292958577475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,32,4,balanced,2.5970346132914224
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,32,4,balanced,3.6971521377563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,32,4,balanced,4.8406187693278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,2,1,power_law_1.01,13.156352233886718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,32,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,32,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,32,power_law_1.2,0.025382399559020996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,32,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,32,power_law_1.2,0.025177600979804992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,32,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,32,power_law_1.2,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,32,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,32,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,32,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,32,power_law_1.2,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,32,power_law_1.2,0.02905600070953369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,32,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,32,power_law_1.2,0.03153280019760132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,32,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,32,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,32,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,32,power_law_1.2,0.04585599899291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,32,power_law_1.2,0.04893440008163452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,32,power_law_1.2,0.0737280011177063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,32,power_law_1.2,0.09482240080833435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,32,power_law_1.2,0.12776319980621337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,32,power_law_1.2,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,32,power_law_1.2,0.34303998947143555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,32,power_law_1.2,0.496230411529541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,32,power_law_1.2,0.7000063896179199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,2,1,power_law_1.01,17.027687072753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,32,power_law_1.2,0.9711615562438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,2,power_law_1.01,0.4415487766265869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,2,power_law_1.01,0.7448575973510743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,2,power_law_1.01,0.9596927642822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,2,power_law_1.01,1.4520319938659667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,2,power_law_1.01,2.0389888763427733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,2,power_law_1.01,3.202867126464844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,2,power_law_1.01,3.4310142517089846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,2,power_law_1.01,3.365273666381836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,2,power_law_1.01,3.5069950103759764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,2,power_law_1.01,3.5586048126220704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,2,power_law_1.01,3.6913150787353515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,2,power_law_1.01,3.7138431549072264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,2,power_law_1.01,3.717734527587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,2,power_law_1.01,3.8959102630615234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,2,power_law_1.01,3.9397377014160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,2,power_law_1.01,3.9733249664306642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,2,power_law_1.01,4.170342254638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,2,power_law_1.01,4.46300163269043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,2,power_law_1.01,4.695859146118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,2,power_law_1.01,5.067161560058594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,2,power_law_1.01,5.568505477905274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,2,power_law_1.01,6.805299377441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,2,power_law_1.01,7.35436782836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,2,power_law_1.01,9.240576171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,2,power_law_1.01,11.046092987060547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,16,power_law_1.2,0.8187904357910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,2,power_law_1.01,15.532441711425781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,16,power_law_1.2,1.0457088470458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,16,power_law_1.2,1.072537612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,16,power_law_1.2,1.071718406677246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,16,power_law_1.2,1.0285056114196778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,16,power_law_1.2,0.9664511680603027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,16,power_law_1.2,0.9338879585266113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,16,power_law_1.2,0.9723903656005859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,16,power_law_1.2,0.9478143692016602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,16,power_law_1.2,0.9971712112426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,2,power_law_1.01,19.358309936523437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,16,power_law_1.2,1.032806396484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,16,power_law_1.2,1.0487808227539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,16,power_law_1.2,0.9666560173034668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,16,power_law_1.2,1.1087871551513673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,16,power_law_1.2,1.1087871551513673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,16,power_law_1.2,1.1143168449401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,16,power_law_1.2,1.1094016075134276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,16,power_law_1.2,1.2126208305358888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,16,power_law_1.2,1.2857343673706054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,16,power_law_1.2,1.4675968170166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,16,power_law_1.2,1.6953344345092773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,8,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,16,power_law_1.2,2.3789567947387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,8,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,8,power_law_1.2,0.02945919930934906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,8,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,8,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,8,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,16,power_law_1.2,2.2763519287109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,8,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,8,power_law_1.2,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,8,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,8,power_law_1.2,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,8,power_law_1.2,0.036032000184059144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,16,power_law_1.2,3.294412612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,8,power_law_1.2,0.037868800759315493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,8,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,8,power_law_1.2,0.045440000295639035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,8,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,8,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,8,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,8,power_law_1.2,0.08151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,16,power_law_1.2,3.817881774902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,8,power_law_1.2,0.15029120445251465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,8,power_law_1.2,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,8,power_law_1.2,0.30655999183654786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,8,power_law_1.2,0.4278272151947021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,16,power_law_1.2,5.860556793212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,8,power_law_1.2,0.6914048194885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,8,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,8,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,8,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,8,power_law_1.2,0.028454399108886717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,8,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,8,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,8,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,16,power_law_1.2,7.290675354003906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,8,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,8,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,8,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,8,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,8,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,8,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,8,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,8,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,8,power_law_1.2,0.06758400201797485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,8,power_law_1.2,0.09113600254058837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,8,power_law_1.2,0.13230079412460327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,8,power_law_1.2,0.13987840414047242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,8,power_law_1.2,0.18554879426956178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,8,power_law_1.2,1.1079680442810058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,8,power_law_1.2,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,8,power_law_1.2,0.4405248165130615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,8,power_law_1.2,1.8585599899291991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,1,8,balanced,0.049135997891426086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,1,8,balanced,0.06570666531721751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,1,8,balanced,0.3037866751352946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,1,8,balanced,0.5712159872055054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,1,8,balanced,1.098581314086914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,1,8,balanced,1.3624320030212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,1,8,balanced,1.366869290669759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,1,8,balanced,1.37062406539917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,1,8,balanced,1.3750613530476887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,1,8,balanced,1.3788159688313801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,1,8,balanced,1.3852799733479817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,1,8,balanced,1.3907626469930012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,1,8,balanced,1.3986132939656575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,1,8,balanced,1.4105599721272786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,1,8,balanced,1.4221653938293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,1,8,balanced,1.4361599286397297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,1,8,balanced,1.4581759770711262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,1,8,balanced,1.504085381825765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,1,8,balanced,1.5510187149047852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,1,8,balanced,1.635327974955241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,1,8,balanced,1.6873812675476074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,1,8,balanced,1.8269866307576497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,1,8,balanced,2.0157440503438315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,1,8,balanced,2.5364480018615723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,1,8,balanced,3.0044161478678384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,1,8,balanced,4.401322682698567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,1,8,balanced,5.8209279378255205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,8,power_law_1.2,0.6406144142150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,4,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,4,power_law_1.01,0.2953216075897217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,4,power_law_1.01,0.4161344051361084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,4,power_law_1.01,0.5169151782989502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,4,power_law_1.01,0.5457920074462891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,4,power_law_1.01,0.6873087882995605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,4,power_law_1.01,0.842137622833252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,8,power_law_1.2,0.8857600212097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,4,power_law_1.01,0.9224191665649414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,4,power_law_1.01,0.9334783554077148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,4,power_law_1.01,0.8722432136535645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,4,power_law_1.01,0.9189248085021973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,4,power_law_1.01,0.9603072166442871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,4,power_law_1.01,0.9148415565490723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,4,power_law_1.01,1.0065919876098632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,4,power_law_1.01,1.0391488075256348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,4,power_law_1.01,1.0430272102355957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,4,power_law_1.01,1.05163516998291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,4,power_law_1.01,1.155686378479004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,4,power_law_1.01,1.1599871635437011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,4,power_law_1.01,1.315225601196289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,4,power_law_1.01,1.4233599662780763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,4,power_law_1.01,1.7778623580932618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,4,power_law_1.01,2.126233673095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,4,power_law_1.01,2.9044736862182616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,4,power_law_1.01,3.3529857635498046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,4,power_law_1.01,4.795174407958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,4,power_law_1.01,6.167756652832031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,8,power_law_1.2,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,8,power_law_1.2,2.207744026184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,4,power_law_1.01,0.6006783962249755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,4,power_law_1.01,1.0364928245544434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,4,power_law_1.01,2.0957183837890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,4,power_law_1.01,2.31014404296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,4,power_law_1.01,3.002982330322266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,4,power_law_1.01,3.4451454162597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,4,power_law_1.01,3.8604801177978514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,4,power_law_1.01,5.256396865844726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,4,power_law_1.01,5.069203186035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,4,power_law_1.01,4.6753791809082035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,4,power_law_1.01,5.0692096710205075
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,4,power_law_1.01,4.500672149658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,4,power_law_1.01,4.878745651245117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,4,power_law_1.01,4.8373760223388675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,4,power_law_1.01,5.3897216796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,4,power_law_1.01,5.483315277099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,4,power_law_1.01,5.652659225463867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,4,power_law_1.01,5.528166580200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,4,power_law_1.01,5.390745544433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,4,power_law_1.01,5.849702453613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,4,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,4,power_law_1.01,0.16383999586105347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,4,power_law_1.01,6.216704177856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,4,power_law_1.01,0.212172794342041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,4,power_law_1.01,0.291430401802063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,4,power_law_1.01,0.2875328063964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,4,power_law_1.01,0.3936255931854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,4,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,4,power_law_1.01,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,4,power_law_1.01,0.4132863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,4,power_law_1.01,7.141990661621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,4,power_law_1.01,0.4587200164794922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,4,power_law_1.01,0.46284799575805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,4,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,4,power_law_1.01,0.4753407955169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,4,power_law_1.01,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,4,power_law_1.01,0.4773888111114502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,4,power_law_1.01,0.497049617767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,4,power_law_1.01,7.8215171813964846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,4,power_law_1.01,0.5097472190856933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,4,power_law_1.01,0.571392011642456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,4,power_law_1.01,0.5711872100830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,4,power_law_1.01,0.661299180984497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,4,power_law_1.01,0.7458816051483155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,4,power_law_1.01,0.9889792442321778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,4,power_law_1.01,1.211571216583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,4,power_law_1.01,1.76312313079834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,4,power_law_1.01,9.333734130859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,4,power_law_1.01,2.0676607131958007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,4,power_law_1.01,3.0901952743530274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,4,power_law_1.01,4.110950469970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,4,power_law_1.01,10.068787384033204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,4,power_law_1.01,13.408460998535157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,8,power_law_1.2,2.107596778869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,4,power_law_1.01,16.00163879394531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,8,power_law_1.2,2.9169599533081056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,8,power_law_1.2,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,8,power_law_1.2,0.28446719646453855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,8,power_law_1.2,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,8,power_law_1.2,0.2791424036026001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,8,power_law_1.2,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,8,power_law_1.2,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,8,power_law_1.2,0.28631041049957273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,8,power_law_1.2,0.2883584022521973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,8,power_law_1.2,0.3358720064163208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,8,power_law_1.2,0.3375103950500488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,8,power_law_1.2,0.522438383102417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,8,power_law_1.2,0.7770112037658692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,8,power_law_1.2,0.8093695640563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,8,power_law_1.2,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,8,power_law_1.2,0.7231488227844238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,8,power_law_1.2,0.8050559997558594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,8,power_law_1.2,0.7546879768371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,8,power_law_1.2,1.0233856201171876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,8,power_law_1.2,1.2507136344909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,32,4,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,32,4,power_law_1.01,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,32,4,power_law_1.01,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,32,4,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,32,4,power_law_1.01,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,32,4,power_law_1.01,0.026214399933815004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,32,4,power_law_1.01,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,32,4,power_law_1.01,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,32,4,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,32,4,power_law_1.01,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,32,4,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,8,power_law_1.2,1.7702911376953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,32,4,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,32,4,power_law_1.01,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,32,4,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,32,4,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,32,4,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,32,4,power_law_1.01,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,32,4,power_law_1.01,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,32,4,power_law_1.01,0.07987200021743775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,32,4,power_law_1.01,0.09564160108566284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,8,power_law_1.2,2.226585578918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,8,power_law_1.2,3.201433563232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,32,4,power_law_1.01,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,32,4,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,8,power_law_1.2,4.37657585144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,32,4,power_law_1.01,0.3502079963684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,4,64,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,4,64,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,4,64,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,4,64,balanced,0.051541333397229515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,4,64,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,4,64,balanced,0.06485333542029063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,4,64,balanced,0.2182826598485311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,4,64,balanced,0.2198186715443929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,4,64,balanced,0.21998933951059976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,4,64,balanced,0.22050132354100546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,4,64,balanced,0.22152533133824667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,4,64,balanced,0.22408533096313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,4,64,balanced,0.22510933876037598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,4,64,balanced,0.22801067431767783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,4,64,balanced,0.23244800170262656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,4,64,balanced,0.23432532946268717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,4,64,balanced,0.23995733261108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,4,64,balanced,0.25412267446517944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,4,64,balanced,0.27033599217732746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,4,64,balanced,0.2943999965985616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,4,64,balanced,0.31539199749628705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,4,64,balanced,0.3609600067138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,32,4,power_law_1.01,0.4831232070922852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,4,64,balanced,0.44817066192626953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,4,64,balanced,0.5333333412806193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,4,64,balanced,0.6367573340733846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,4,64,balanced,0.8722773392995199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,4,64,balanced,1.1613866488138835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,32,4,power_law_1.01,0.7825407981872559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,8,power_law_1.2,6.125568008422851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,1,balanced,0.06553600231806438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,1,balanced,0.08106666803359985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,1,balanced,0.2792106668154399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,1,balanced,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,1,balanced,1.0263893604278564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,1,balanced,2.017279942830404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,1,balanced,2.029909292856852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,1,balanced,2.0488533973693848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,1,balanced,2.066090742746989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,1,balanced,2.0804266929626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,1,balanced,2.1021013259887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,1,balanced,2.1275307337443032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,1,balanced,2.1492053667704263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,1,balanced,2.198527971903483
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,1,balanced,2.249215920766195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,1,balanced,2.2990506490071616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,1,balanced,2.3906985918680825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,32,4,power_law_1.01,1.183743953704834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,1,balanced,2.639018694559733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,1,balanced,2.8323841094970703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,1,balanced,3.215189297993978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,1,balanced,3.6857172648111978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,8,power_law_1.2,8.059494018554688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,1,balanced,4.629834810892741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,1,balanced,5.490346908569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,1,balanced,7.39686393737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,1,balanced,9.307647705078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,1,balanced,13.280768076578775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,1,balanced,16.916309356689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,32,4,power_law_1.01,1.7147775650024415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,4,power_law_1.2,0.338918399810791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,4,power_law_1.2,0.324403190612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,4,power_law_1.2,0.4239039897918701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,4,power_law_1.2,0.5488639831542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,4,power_law_1.2,0.4786111831665039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,4,power_law_1.2,0.533894395828247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,4,power_law_1.2,0.5410687923431396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,4,power_law_1.2,0.5556223869323731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,4,power_law_1.2,0.6088704109191895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,4,power_law_1.2,0.6158336162567138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,4,power_law_1.2,0.6571839809417724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,4,power_law_1.2,0.7634943962097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,4,power_law_1.2,0.8165375709533691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,4,power_law_1.2,0.7751488208770752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,4,power_law_1.2,0.8507391929626464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,4,power_law_1.2,0.9768959999084472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,4,power_law_1.2,1.1499520301818849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,4,power_law_1.2,1.55033597946167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,4,power_law_1.2,1.7532928466796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,4,power_law_1.2,2.409459114074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,4,power_law_1.2,2.769887924194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,4,power_law_1.2,3.9219200134277346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,8,power_law_1.2,12.245811462402344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,4,power_law_1.2,5.088051223754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,32,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,32,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,32,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,32,power_law_1.2,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,32,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,32,power_law_1.2,0.04586879909038544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,32,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,32,power_law_1.2,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,32,power_law_1.2,0.04872959852218628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,32,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,32,power_law_1.2,0.050995200872421265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,32,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,32,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,32,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,32,power_law_1.2,0.06000639796257019
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,32,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,32,power_law_1.2,0.06878079771995545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,32,power_law_1.2,0.0796671986579895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,32,power_law_1.2,0.12615679502487182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,32,power_law_1.2,0.21913599967956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,32,power_law_1.2,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,32,power_law_1.2,0.41143040657043456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,32,power_law_1.2,0.5541888236999511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,32,power_law_1.2,0.8482815742492675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,32,power_law_1.2,1.2890111923217773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,32,power_law_1.2,1.9345407485961914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,32,power_law_1.2,2.7873279571533205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,4,power_law_1.2,6.861004638671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,8,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,8,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,8,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,8,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,8,balanced,0.06364800035953522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,8,balanced,0.2739199995994568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,8,balanced,0.40533332029978436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,8,balanced,0.4116479953130086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,8,balanced,0.4121599992116292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,8,balanced,0.4145493507385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,8,balanced,0.4150613149007161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,8,balanced,0.4203519821166992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,8,balanced,0.42322667439778644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,8,balanced,0.4307626485824585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,8,balanced,0.43434667587280273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,8,balanced,0.4411733150482178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,8,balanced,0.45448533693949383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,4,power_law_1.2,8.340070343017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,8,balanced,0.48024535179138184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,8,balanced,0.5200213193893433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,8,balanced,0.5852160056432089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,8,balanced,0.6367573340733846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,8,balanced,0.7765333652496338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,8,balanced,0.9576000372568766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,8,balanced,1.3475839296976726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,8,balanced,1.7566720644632976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,8,balanced,2.395136038462321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,8,balanced,3.0504961013793945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,16,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,16,power_law_1.2,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,16,power_law_1.2,0.38154239654541017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,16,power_law_1.2,0.3600383996963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,16,power_law_1.2,0.4048895835876465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,16,power_law_1.2,0.41758079528808595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,16,power_law_1.2,0.3416064023971558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,16,power_law_1.2,0.3284991979598999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,16,power_law_1.2,0.39034879207611084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,8,power_law_1.2,16.254771423339843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,16,power_law_1.2,0.3250175952911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,16,power_law_1.2,0.3510272026062012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,16,power_law_1.2,0.3383296012878418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,16,power_law_1.2,0.3925951957702637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,16,power_law_1.2,0.36863999366760253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,16,power_law_1.2,0.39342079162597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,16,power_law_1.2,0.4247551918029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,16,power_law_1.2,0.4388864040374756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,16,power_law_1.2,0.4583424091339111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,16,power_law_1.2,0.5175295829772949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,16,power_law_1.2,0.5748735904693604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,16,power_law_1.2,0.638976001739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,16,power_law_1.2,0.8202239990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,16,power_law_1.2,0.9902079582214356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,16,power_law_1.2,1.3613056182861327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,4,power_law_1.2,15.778169250488281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,16,power_law_1.2,1.818623924255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,16,power_law_1.2,2.7809791564941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,16,power_law_1.2,3.9221248626708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,4,power_law_1.2,17.171661376953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,8,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,8,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,8,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,8,power_law_1.01,0.03747200071811676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,8,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,8,power_law_1.01,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,8,power_law_1.01,0.03808639943599701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,8,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,8,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,8,power_law_1.01,0.04074879884719849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,8,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,8,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,8,power_law_1.01,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,8,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,8,power_law_1.01,0.06307839751243591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,8,power_law_1.01,0.07946239709854126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,8,power_law_1.01,0.09215999841690063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,8,power_law_1.01,0.17858560085296632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,8,power_law_1.01,0.23101439476013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,8,power_law_1.01,0.27381761074066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,8,power_law_1.01,0.3510272026062012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,8,power_law_1.01,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,8,power_law_1.01,0.5928959846496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,8,power_law_1.01,0.9760767936706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,8,power_law_1.01,1.3711359977722168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,1,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,1,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,1,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,1,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,1,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,1,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,1,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,1,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,1,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,1,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,1,balanced,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,1,balanced,0.05460800230503082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,1,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,1,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,1,balanced,0.0981333355108897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,1,balanced,0.10956799983978271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,1,balanced,0.10683733224868774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,1,balanced,0.20121600230534872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,1,balanced,0.20462934176127115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,1,balanced,0.2725546757380168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,1,balanced,0.34815998872121173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,1,balanced,0.5236053466796875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,1,balanced,0.7763626575469971
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,1,balanced,1.2202666600545247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,1,balanced,1.6498346328735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,1,balanced,2.502650737762451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,1,balanced,3.403264045715332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,4,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,4,balanced,0.027647999425729115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,4,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,4,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,4,balanced,0.04487466812133789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,4,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,4,balanced,0.03871466716130575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,4,balanced,0.039066667358080544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,4,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,4,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,4,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,4,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,4,balanced,0.043178667624791466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,4,balanced,0.04488533238569895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,4,balanced,0.05000533163547516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,4,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,4,balanced,0.07406933108965556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,4,balanced,0.1616213321685791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,4,balanced,0.20786666870117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,4,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,4,balanced,0.29422932863235474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,4,balanced,0.3942399819691976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,4,balanced,0.4968106746673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,4,balanced,0.7507627010345459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,4,balanced,1.0461866855621338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,4,balanced,1.694719950358073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,4,balanced,2.376533349355062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,4,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,4,power_law_1.01,0.15626239776611328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,4,power_law_1.01,0.13393919467926024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,4,power_law_1.01,0.23306241035461425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,4,power_law_1.01,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,4,power_law_1.01,0.4526080131530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,4,power_law_1.01,0.44031357765197754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,4,power_law_1.01,0.42045440673828127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,4,power_law_1.01,0.40857601165771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,4,power_law_1.01,0.45035519599914553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,4,power_law_1.01,0.4491263866424561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,4,power_law_1.01,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,4,power_law_1.01,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,4,power_law_1.01,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,4,power_law_1.01,0.48578557968139646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,4,power_law_1.01,0.5023744106292725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,4,power_law_1.01,0.5124095916748047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,4,power_law_1.01,0.5138432025909424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,4,power_law_1.01,0.5427199840545655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,4,power_law_1.01,0.6059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,4,power_law_1.01,0.6502399921417237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,4,power_law_1.01,0.7948287963867188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,4,power_law_1.01,0.9252863883972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,4,power_law_1.01,1.231436824798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,4,power_law_1.01,1.5077119827270509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,4,power_law_1.01,2.365228843688965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,4,power_law_1.01,2.7903743743896485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,1,balanced,0.5881173213322958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,1,balanced,1.0289493401845295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,1,balanced,2.019498666127523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,1,balanced,3.98250675201416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,1,balanced,7.902720133463542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,1,balanced,15.742635091145834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,1,balanced,23.58289082845052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,1,balanced,23.621632893880207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,1,balanced,23.661903381347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,1,balanced,23.706624348958332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,1,balanced,23.77471923828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,1,balanced,23.84179178873698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,1,balanced,23.911936442057293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,1,balanced,24.032427469889324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,1,balanced,24.136683146158855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,1,balanced,24.24302927652995
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,256,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,256,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,256,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,1,balanced,24.444414774576824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,256,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,256,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,256,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,256,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,256,power_law_1.2,0.04074240028858185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,256,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,256,power_law_1.2,0.04136959910392761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,256,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,256,power_law_1.2,0.04341759979724884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,256,power_law_1.2,0.07823359966278076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,256,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,256,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,256,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,256,power_law_1.2,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,256,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,1,balanced,24.770731608072918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,256,power_law_1.2,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,256,power_law_1.2,0.11612160205841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,256,power_law_1.2,0.1529855966567993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,256,power_law_1.2,0.24185600280761718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,256,power_law_1.2,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,256,power_law_1.2,0.5670911788940429
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,256,power_law_1.2,0.8208383560180664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,256,power_law_1.2,1.2206080436706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,256,power_law_1.2,1.7111040115356446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,1,balanced,25.072980244954426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,1,balanced,25.640106201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,1,balanced,26.23334503173828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,2,power_law_1.2,1.6275455474853515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,2,power_law_1.2,2.4420223236083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,1,balanced,27.322537740071613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,2,power_law_1.2,3.7206016540527345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,2,power_law_1.2,5.352243041992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,2,power_law_1.2,7.263846588134766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,1,balanced,28.393470764160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,2,power_law_1.2,12.029747009277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,2,power_law_1.2,13.290290832519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,1,balanced,32.65126291910807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,2,power_law_1.2,12.943154907226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,1,balanced,31.419705708821613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,2,power_law_1.2,13.999104309082032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,2,power_law_1.2,14.023269653320312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,1,balanced,36.40558878580729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,2,power_law_1.2,14.20226593017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,2,power_law_1.2,15.151922607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,2,power_law_1.2,15.430233764648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,1,balanced,45.55298360188802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,2,power_law_1.2,16.043609619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,2,power_law_1.2,16.768614196777342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,16,power_law_1.01,0.028863999247550964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,16,power_law_1.01,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,16,power_law_1.01,0.027628800272941588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,16,power_law_1.01,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,2,power_law_1.2,16.96563262939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,16,power_law_1.01,0.02537600100040436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,16,power_law_1.01,0.028249600529670717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,16,power_law_1.01,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,16,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,16,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,16,power_law_1.01,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,16,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,16,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,16,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,16,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,16,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,16,power_law_1.01,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,16,power_law_1.01,0.07311360239982605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,16,power_law_1.01,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,16,power_law_1.01,0.10751999616622925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,16,power_law_1.01,0.1462272047996521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,16,power_law_1.01,0.17469439506530762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,16,power_law_1.01,0.2957312107086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,16,power_law_1.01,0.3717119932174683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,2,power_law_1.2,17.044889831542967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,16,power_law_1.01,0.5750783920288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,16,power_law_1.01,0.6805503845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,16,power_law_1.01,1.152409553527832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,16,power_law_1.01,1.4225407600402833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,2,power_law_1.2,18.054348754882813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,2,power_law_1.2,18.572288513183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,2,power_law_1.2,19.134669494628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,2,power_law_1.2,20.524441528320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,2,power_law_1.2,23.63555908203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,2,power_law_1.2,24.651980590820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,2,power_law_1.2,31.08741149902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,2,power_law_1.2,36.33336181640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,8,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,8,balanced,0.035317334036032356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,8,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,8,balanced,0.19370667139689127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,8,balanced,0.1950719952583313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,8,balanced,0.1967786749204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,8,balanced,0.19797333081563315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,8,balanced,0.19848533471425375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,8,balanced,0.20121065775553384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,8,balanced,0.2135039965311686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,8,balanced,0.20497065782546997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,8,balanced,0.20872533321380615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,8,balanced,0.21504000822703043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,8,balanced,0.2182826598485311
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,8,balanced,0.2285226583480835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,8,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,8,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,8,balanced,0.2773226698239644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,8,balanced,0.31726932525634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,8,balanced,0.37273601690928143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,8,balanced,0.41335467497507733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,8,balanced,0.5222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,8,balanced,0.6490453481674194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,8,balanced,0.9728000164031982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,8,balanced,1.3637973467508953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,2,power_law_1.2,48.17489929199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,2,balanced,0.23432532946268717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,2,balanced,0.4509013493855794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,2,balanced,0.8374613126118978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,2,balanced,1.495039939880371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,2,balanced,2.8866453170776367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,2,balanced,4.131834665934245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,2,balanced,4.149077415466309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,2,balanced,4.163242657979329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,2,balanced,4.185770670572917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,2,balanced,4.2014719645182295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,2,balanced,4.2294613520304365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,2,balanced,4.263423919677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,2,balanced,4.2926025390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,2,balanced,4.3412478764851885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,2,balanced,4.390912055969238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,2,balanced,4.434432029724121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,2,balanced,4.532906532287598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,2,balanced,4.715349197387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,2,balanced,4.8192853927612305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,2,power_law_1.2,55.0434814453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,2,balanced,5.08842658996582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,2,balanced,5.389823913574219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,2,balanced,6.08290163675944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,2,balanced,6.763861338297526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,2,balanced,8.43178685506185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,2,balanced,10.148864110310873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,2,balanced,13.751295725504557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,2,balanced,17.443157196044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,4,8,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,4,8,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,4,8,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,4,8,balanced,0.10427733262379964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,4,8,balanced,0.30771199862162274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,4,8,balanced,0.3771626551946004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,4,8,balanced,0.3792213201522827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,4,8,balanced,0.38177065054575604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,4,8,balanced,0.3838293155034383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,4,8,balanced,0.38519465923309326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,4,8,balanced,0.38860801855723065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,4,8,balanced,0.3930453459421794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,4,8,balanced,0.3964586655298869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,4,8,balanced,0.40396801630655926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,4,8,balanced,0.4131840070088704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,4,8,balanced,0.4184746742248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,4,8,balanced,0.43025068442026776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,4,8,balanced,0.4585813283920288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,4,8,balanced,0.4927146832148234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,4,8,balanced,0.5379413366317749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,4,8,balanced,0.5751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,4,8,balanced,0.6795946756998698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,4,8,balanced,0.7987146377563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,4,8,balanced,1.117525339126587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,4,8,balanced,1.498794714609782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,4,8,balanced,2.1811092694600425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,4,8,balanced,2.8636159896850586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.039699199795722964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.20602879524230958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.21850240230560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.21913599967956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.23388159275054932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.2451456069946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.2551487922668457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.30167040824890134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.3141439914703369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.3225600004196167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.35389440059661864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.430079984664917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.5349247932434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.7903232097625732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,1,power_law_1.01,1.0483712196350097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,1,power_law_1.01,1.5177727699279786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,1,power_law_1.01,1.9906560897827148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,1,power_law_1.01,3.0314495086669924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,1,power_law_1.01,4.063398361206055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,1,power_law_1.01,6.178611373901367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,1,power_law_1.01,8.305049896240234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.07454720139503479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.20398080348968506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.31703040599822996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.41021437644958497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.743833589553833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.8032256126403808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.8411135673522949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.841318416595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.87838716506958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.89169921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.932863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.9498623847961426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.9738240242004395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.9891839981079101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,1,power_law_1.2,1.0457088470458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,1,power_law_1.2,1.0704895973205566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,1,power_law_1.2,1.1726847648620606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,1,power_law_1.2,1.3137920379638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,1,power_law_1.2,1.5673343658447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,1,power_law_1.2,1.8325376510620117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,1,power_law_1.2,2.3533504486083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,1,power_law_1.2,2.7994112014770507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,1,power_law_1.2,3.948953628540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,1,power_law_1.2,5.0143169403076175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,1,power_law_1.2,7.326924896240234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,8,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,8,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,8,power_law_1.2,0.0899071991443634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,8,power_law_1.2,0.11755520105361938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,8,power_law_1.2,0.12431360483169555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,8,power_law_1.2,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,8,power_law_1.2,0.23060479164123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,8,power_law_1.2,0.24883201122283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,8,power_law_1.2,0.24043519496917726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,8,power_law_1.2,0.24798719882965087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,8,power_law_1.2,0.25678720474243166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,8,power_law_1.2,0.26255359649658205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,8,power_law_1.2,0.2525183916091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,8,power_law_1.2,0.2535423994064331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,8,power_law_1.2,0.2809727907180786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,8,power_law_1.2,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,8,power_law_1.2,0.3010560035705566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,8,power_law_1.2,0.32931840419769287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,8,power_law_1.2,0.3463167905807495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,8,power_law_1.2,0.41491198539733887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,8,power_law_1.2,0.47472639083862306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,8,power_law_1.2,0.6901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,8,power_law_1.2,0.8398847579956055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,8,power_law_1.2,1.336524772644043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,8,power_law_1.2,1.6347135543823241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,1,power_law_1.2,9.631129455566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,8,power_law_1.2,2.534809684753418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.10629119873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.23490560054779053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.5119999885559082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.5029888153076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.531660795211792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.5269504070281983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.5494656085968017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.5369855880737304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.5570559978485108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.5672895908355713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.5689343929290771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.5642240047454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.5748735904693604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.6184959888458252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.6234111785888672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.6600639820098877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.8071167945861817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.873465633392334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,1,power_law_1.2,1.0500096321105956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,1,power_law_1.2,1.308467197418213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,128,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,128,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,128,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,128,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,128,power_law_1.2,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,128,power_law_1.2,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,128,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,1,power_law_1.2,1.7954816818237305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,128,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,128,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,128,power_law_1.2,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,128,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,128,power_law_1.2,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,128,power_law_1.2,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,128,power_law_1.2,0.06347519755363465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,128,power_law_1.2,0.06819199919700622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,128,power_law_1.2,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,128,power_law_1.2,0.08376320004463196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,128,power_law_1.2,0.12677119970321654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,128,power_law_1.2,0.18042880296707153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,128,power_law_1.2,0.2592639923095703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,128,power_law_1.2,0.34037759304046633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,128,power_law_1.2,0.4681727886199951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,128,power_law_1.2,0.6795263767242432
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,128,power_law_1.2,0.97259521484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,128,power_law_1.2,1.3314047813415528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,128,power_law_1.2,2.1565439224243166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,128,power_law_1.2,3.083673667907715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,4,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,4,power_law_1.01,0.14499839544296264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,1,power_law_1.2,2.332057571411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,4,power_law_1.01,0.2160640001296997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,4,power_law_1.01,0.2775039911270142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,4,power_law_1.01,0.31641600131988523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,4,power_law_1.01,0.4005887985229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,4,power_law_1.01,0.40611839294433594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,4,power_law_1.01,0.4143104076385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,4,power_law_1.01,0.43683838844299316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,4,power_law_1.01,0.454041576385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,4,power_law_1.01,0.44400639533996583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,4,power_law_1.01,0.4743167877197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,4,power_law_1.01,0.4603903770446777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,4,power_law_1.01,0.4734975814819336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,4,power_law_1.01,0.48721919059753416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,4,power_law_1.01,0.49643521308898925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,4,power_law_1.01,0.4898816108703613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,8,power_law_1.2,3.382681655883789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,4,power_law_1.01,0.5498879909515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,4,power_law_1.01,0.6012800216674805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,4,power_law_1.01,0.6637567996978759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,4,power_law_1.01,0.7690239906311035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,4,power_law_1.01,1.0223615646362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,4,power_law_1.01,1.177190399169922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,4,power_law_1.01,1.7412096023559571
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,4,power_law_1.01,2.0998144149780273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,4,power_law_1.01,3.1670272827148436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,4,power_law_1.01,4.5101055145263675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,1,power_law_1.01,0.07045120000839233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,1,power_law_1.01,0.30351359844207765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,1,power_law_1.01,0.5517312049865722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,1,power_law_1.01,1.0248191833496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,1,power_law_1.01,1.8718719482421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,1,power_law_1.01,2.6011648178100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,1,power_law_1.01,3.055379295349121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,1,power_law_1.2,3.452102279663086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,1,power_law_1.01,3.9774208068847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,1,power_law_1.01,4.153753662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,1,power_law_1.01,4.312051010131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,1,power_law_1.01,4.476518249511718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,1,power_law_1.2,4.425113677978516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,1,power_law_1.01,4.712652969360351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,1,power_law_1.01,4.714495849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,1,power_law_1.01,4.930355072021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,1,power_law_1.01,5.007148742675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,8,2,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,1,power_law_1.01,5.241651153564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,8,2,balanced,0.0382080003619194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,8,2,balanced,0.24593067169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,8,2,balanced,0.24678399165471396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,8,2,balanced,0.24780799945195517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,8,2,balanced,0.24985599517822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,8,2,balanced,0.2510506709416707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,8,2,balanced,0.25034133593241376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,8,2,balanced,0.25172799825668335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,8,2,balanced,0.25309866666793823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,8,2,balanced,0.2571946581204732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,8,2,balanced,0.26129066944122314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,8,2,balanced,0.265557328859965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,8,2,balanced,0.26450665791829425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,8,2,balanced,0.272213339805603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,8,2,balanced,0.276309331258138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,1,power_law_1.01,5.31517448425293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,8,2,balanced,0.28279467423756915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,8,2,balanced,0.3141973416010539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,8,2,balanced,0.35498666763305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,8,2,balanced,0.4326346715291341
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,8,2,balanced,0.5374293327331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,1,power_law_1.01,5.752627182006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,8,2,balanced,0.777557373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,8,2,balanced,1.0712746779123943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,8,2,balanced,1.6721919377644856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,8,2,balanced,2.2935892740885415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,1,power_law_1.01,6.039347076416016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,8,2,balanced,3.5411628087361655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,1,power_law_1.01,6.584524536132813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,8,2,balanced,4.6469119389851885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,1,power_law_1.01,7.013375854492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,1,power_law_1.01,7.718911743164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,1,power_law_1.01,8.495494079589843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,1,power_law_1.01,10.190847778320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,1,power_law_1.01,11.993497467041015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,1,power_law_1.01,15.750924682617187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,1,power_law_1.01,19.328614807128908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,1,power_law_1.2,6.352896118164063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,4,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,4,balanced,0.05256533126036326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,4,balanced,0.05648000041643778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,4,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,4,balanced,0.27611732482910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,4,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,4,balanced,0.5435733397801717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,4,balanced,0.5358933210372925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,4,balanced,0.5398186842600504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,4,balanced,0.544597347577413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,4,balanced,0.5532960096995035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,4,balanced,0.5531306664148966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,4,balanced,0.5614933172861735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,4,balanced,0.5623466571172079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,4,balanced,0.5807786782582601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,4,balanced,0.5901653369267782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,4,balanced,0.6121813456217448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,4,balanced,0.6729333400726318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,4,balanced,0.7188159624735514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,4,balanced,0.86135466893514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,4,balanced,0.9538559913635254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,4,balanced,1.246549367904663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,4,balanced,1.5199573834737141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,4,balanced,2.113365332285563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,4,balanced,2.703359921773275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,4,balanced,3.8725973765055337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,4,balanced,5.001898765563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,1,power_law_1.2,8.180735778808593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,1,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,1,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,1,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,1,power_law_1.01,0.07720959782600403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,1,power_law_1.01,0.11141120195388794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,1,power_law_1.01,0.18575359582901002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,1,power_law_1.01,0.2713599920272827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,1,power_law_1.01,0.2836479902267456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,1,power_law_1.01,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,1,power_law_1.01,0.3014656066894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,1,power_law_1.01,0.31784958839416505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,1,power_law_1.01,0.3352576017379761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,1,power_law_1.01,0.34076800346374514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,1,power_law_1.01,0.3667968034744263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,1,power_law_1.01,0.3762176036834717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,1,power_law_1.01,0.3956736087799072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,1,power_law_1.01,0.42946557998657225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,1,power_law_1.01,0.48824319839477537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,1,power_law_1.01,0.5593088150024415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,1,power_law_1.01,0.744652795791626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,1,power_law_1.01,0.9332736015319825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,1,power_law_1.01,1.3103103637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,1,power_law_1.01,1.6785408020019532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,1,power_law_1.01,2.429952049255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,1,power_law_1.01,3.225804901123047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,1,power_law_1.01,4.876902389526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,1,power_law_1.01,6.508748626708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,32,power_law_1.01,1.1722751617431642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,32,power_law_1.01,1.0702848434448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,32,power_law_1.01,1.062502384185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,32,power_law_1.01,1.0690560340881348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,32,power_law_1.01,1.0424320220947265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,32,power_law_1.01,0.8806400299072266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,32,power_law_1.01,0.9654272079467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,32,power_law_1.01,0.9297920227050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,32,power_law_1.01,0.9652223587036133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,32,power_law_1.01,1.0078207969665527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,32,power_law_1.01,0.9572287559509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,32,power_law_1.01,1.0051584243774414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,32,power_law_1.01,1.0573823928833008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,32,power_law_1.01,1.054310417175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,32,power_law_1.01,1.037715244293213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,32,power_law_1.01,1.0145792007446288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,32,power_law_1.01,1.0835968017578126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,32,power_law_1.01,1.1008000373840332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,32,power_law_1.01,1.2095487594604493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,32,power_law_1.01,1.3195263862609863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,32,power_law_1.01,1.5820799827575684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,16,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,32,power_law_1.01,1.9603456497192382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,16,power_law_1.01,0.030905601382255555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,16,power_law_1.01,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,16,power_law_1.01,0.027833598852157592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,16,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,32,power_law_1.01,2.1303295135498046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,16,power_law_1.01,0.02906239926815033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,16,power_law_1.01,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,16,power_law_1.01,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,16,power_law_1.01,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,16,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,16,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,32,power_law_1.01,2.893824005126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,16,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,16,power_law_1.01,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,16,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,16,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,16,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,16,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,16,power_law_1.01,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,32,power_law_1.01,3.147980880737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,16,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,16,power_law_1.01,0.08355839848518372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,16,power_law_1.01,0.11018240451812744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,16,power_law_1.01,0.24084479808807374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,16,power_law_1.01,0.31191039085388184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,16,power_law_1.01,0.4564608097076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,32,power_law_1.01,4.623155212402343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,16,power_law_1.01,0.7172095775604248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,16,power_law_1.01,1.1147135734558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,16,power_law_1.01,1.6134143829345704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,32,power_law_1.01,6.43399658203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,4,power_law_1.2,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,4,power_law_1.2,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,4,power_law_1.2,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,4,power_law_1.2,0.2136064052581787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,4,power_law_1.2,0.20295679569244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,4,power_law_1.2,0.3248127937316895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,4,power_law_1.2,0.3432447910308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,4,power_law_1.2,0.349183988571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,4,power_law_1.2,0.3758080005645752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,4,power_law_1.2,0.3647423982620239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,4,power_law_1.2,0.3950592041015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,4,power_law_1.2,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,4,balanced,0.026943999032179516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,4,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,4,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,4,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,4,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,4,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,4,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,4,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,4,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,4,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,4,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,4,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,4,power_law_1.2,0.39342079162597654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,4,balanced,0.038549333810806274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,4,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,4,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,4,power_law_1.2,0.42311677932739256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,4,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,4,power_law_1.2,0.43827199935913086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,4,balanced,0.048783997694651283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,4,balanced,0.06109866499900818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,4,balanced,0.067071999112765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,4,balanced,0.14284800489743552
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,4,balanced,0.21742933988571167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,4,balanced,0.31539199749628705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,4,balanced,0.4135253429412842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,4,balanced,0.6707200209299723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,4,power_law_1.2,0.44462080001831056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,4,balanced,0.9321813583374023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,4,power_law_1.2,0.4745215892791748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,4,balanced,1.6320853233337402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,4,power_law_1.2,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,4,power_law_1.2,0.571392011642456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,4,balanced,2.280618667602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,4,power_law_1.2,0.7030784130096436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,4,power_law_1.2,0.8998911857604981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,4,power_law_1.2,1.1919360160827637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,4,power_law_1.2,1.624883270263672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,4,power_law_1.2,2.3203840255737305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,4,power_law_1.2,2.67325439453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,8,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,8,balanced,0.030181333422660828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,8,balanced,0.0305173322558403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,8,balanced,0.22527466217676798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,8,balanced,0.3667466640472412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,8,balanced,0.48636798063913983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,8,balanced,0.48739198843638104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,8,balanced,0.4858880043029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,4,power_law_1.2,4.540825653076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,8,balanced,0.4889599879582723
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,8,balanced,0.4891306559244792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,8,balanced,0.49134933948516846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,8,balanced,0.4939093192418416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,8,balanced,0.49561599890391034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,8,balanced,0.5220693349838257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,8,balanced,0.5044906536738077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,8,balanced,0.5073920090993246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,8,balanced,0.5138773520787557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,8,balanced,0.5178026755650839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,8,balanced,0.5294080177942911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,8,balanced,0.5376000006993612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,8,balanced,0.5562026500701904
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,8,balanced,0.6126933495203654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,8,balanced,0.652458667755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,8,balanced,0.8041813373565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,8,balanced,0.8669866720835367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,8,balanced,1.2293120225270588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,8,balanced,1.5115946133931477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,4,power_law_1.2,5.989990234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,8,balanced,0.04401599864164988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,8,balanced,0.04862933357556661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,8,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,8,balanced,0.28569600979487103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,8,balanced,0.4225706656773885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,8,balanced,0.5573973258336385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,8,balanced,0.5608106851577759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,8,balanced,0.5529599984486898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,8,balanced,0.5549866755803426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,8,balanced,0.5573973258336385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,8,balanced,0.5609546502431234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,8,balanced,0.566271980603536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,8,balanced,0.5708800156911215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,8,balanced,0.578549345334371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,8,balanced,0.5913600126902262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,8,balanced,0.5997013250986735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,8,balanced,0.6179519891738892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,8,balanced,0.6580906709035238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,8,balanced,0.6949546337127686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,8,balanced,0.7611733277638754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,8,balanced,0.8370880285898844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,8,balanced,1.0226346651713054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,8,balanced,1.2257280349731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,8,balanced,1.6718506813049316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,8,balanced,1.8984959920247395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,8,balanced,2.866175969441732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,8,balanced,3.78111998240153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,1,power_law_1.01,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,1,power_law_1.01,0.0749504029750824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,1,power_law_1.01,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,1,power_law_1.01,0.4833280086517334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,1,power_law_1.01,0.6889472007751465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,1,power_law_1.01,1.0919936180114747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,1,power_law_1.01,1.1681792259216308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,1,power_law_1.01,1.1689984321594238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,1,power_law_1.01,1.231052780151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,1,power_law_1.01,1.2691455841064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,1,power_law_1.01,1.3094911575317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,1,power_law_1.01,1.3330431938171388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,1,power_law_1.01,1.3660160064697267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,1,power_law_1.01,1.4245887756347657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,1,power_law_1.01,1.4516223907470702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,1,power_law_1.01,1.520639991760254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,1,power_law_1.01,1.6066560745239258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,1,power_law_1.01,1.7543167114257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,1,power_law_1.01,1.9394559860229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,1,power_law_1.01,2.283110427856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,1,power_law_1.01,2.596249580383301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,1,power_law_1.01,3.2083969116210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,1,power_law_1.01,3.6823040008544923
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,1,power_law_1.01,4.914380645751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,1,power_law_1.01,6.293094253540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,1,power_law_1.01,9.146163177490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,1,power_law_1.01,11.848703765869141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,1,power_law_1.01,1.7702911376953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,1,power_law_1.01,3.175833511352539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,1,power_law_1.01,4.200447845458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,1,power_law_1.01,6.614220428466797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,1,power_law_1.01,6.804889678955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,1,power_law_1.01,7.001702117919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,1,power_law_1.01,7.27673568725586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,1,power_law_1.01,7.602175903320313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,1,power_law_1.01,8.59688949584961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,1,power_law_1.01,9.100287628173827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,1,power_law_1.01,8.114380645751954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,1,power_law_1.01,8.664678192138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,1,power_law_1.01,9.091891479492187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,1,power_law_1.01,10.433945465087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,1,power_law_1.01,11.7032958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,1,power_law_1.01,12.571443176269531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,1,power_law_1.01,15.406694030761718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,1,power_law_1.01,19.972915649414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,4,power_law_1.01,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,4,power_law_1.01,0.3919872045516968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,4,power_law_1.01,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,1,power_law_1.01,23.921868896484376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,4,power_law_1.01,0.5490687847137451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,4,power_law_1.01,0.6383615970611572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,4,power_law_1.01,0.9091072082519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,4,power_law_1.01,0.9566207885742187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,4,power_law_1.01,0.9422656059265136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,4,power_law_1.01,0.9236479759216308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,4,power_law_1.01,0.952729606628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,4,power_law_1.01,0.9377408027648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,4,power_law_1.01,0.9783295631408692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,4,power_law_1.01,0.9887359619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,4,power_law_1.2,0.022316800057888032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,4,power_law_1.2,0.022118400037288665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,4,power_law_1.01,1.024409580230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,4,power_law_1.2,0.023347200453281404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,4,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,4,power_law_1.01,1.0866687774658204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,4,power_law_1.2,0.026009601354599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,4,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,4,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,4,power_law_1.01,1.0827775955200196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,4,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,4,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,4,power_law_1.01,1.1144895553588867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,4,power_law_1.2,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,4,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,4,power_law_1.01,1.2267519950866699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,4,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,4,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,4,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,16,4,power_law_1.2,0.02905600070953369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,4,power_law_1.01,1.3313983917236327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,16,4,power_law_1.2,0.026624000072479247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,4,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,1,power_law_1.01,29.457818603515626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,16,4,power_law_1.2,0.026822400093078614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,4,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,16,4,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,4,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,16,4,power_law_1.2,0.02744320034980774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,4,power_law_1.01,1.5738880157470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,16,4,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,4,power_law_1.2,0.09052159786224365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,16,4,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,4,power_law_1.2,0.10240000486373901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,16,4,power_law_1.2,0.028672000765800475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,4,power_law_1.2,0.17141760587692262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,16,4,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,4,power_law_1.01,1.7190719604492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,4,power_law_1.2,0.19844479560852052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,4,power_law_1.2,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,16,4,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,4,power_law_1.01,2.2405120849609377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,16,4,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,16,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,16,4,power_law_1.2,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,4,power_law_1.01,2.5571327209472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,16,4,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,16,4,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,16,4,power_law_1.2,0.053452801704406736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,4,power_law_1.01,3.488972854614258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,16,4,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,4,power_law_1.01,3.9876609802246095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,1,power_law_1.01,35.19590454101562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,16,4,power_law_1.2,0.08704000115394592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,4,power_law_1.01,5.983846282958984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,1,64,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,1,64,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,1,64,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,1,64,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,1,64,balanced,0.03941333293914795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,1,64,balanced,0.19165867567062378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,1,64,balanced,0.192848006884257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,1,64,balanced,0.19317867358525595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,1,64,balanced,0.19353600343068442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,1,64,balanced,0.19370667139689127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,1,64,balanced,0.19490132729212442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,1,64,balanced,0.19592533508936563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,16,4,power_law_1.2,0.1026047945022583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,4,power_law_1.01,7.715020751953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,4,power_law_1.2,0.37457919120788574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,1,64,balanced,0.1971199909845988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,1,64,balanced,0.19985065857569376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,1,64,balanced,0.20341867208480835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,1,64,balanced,0.20494933923085532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,1,64,balanced,0.20770132541656494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,1,64,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,1,64,balanced,0.22818134228388467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,4,power_law_1.2,0.5662720203399658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,1,64,balanced,0.24233599503835043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,1,64,balanced,0.2508693337440491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,1,64,balanced,0.28893866141637164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,1,64,balanced,0.30446932713190716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,16,4,power_law_1.2,0.14172159433364867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,1,64,balanced,0.37905065218607586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,1,64,balanced,0.39816534519195557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,1,64,balanced,0.5592746734619141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,1,64,balanced,0.6835199991861979
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,16,4,power_law_1.2,0.17448960542678832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,64,power_law_1.2,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,64,power_law_1.2,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,64,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,1,power_law_1.01,39.78670043945313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,64,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,64,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,64,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,64,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,64,power_law_1.2,0.05507199764251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,64,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,4,power_law_1.2,0.8978431701660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,64,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,64,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,64,power_law_1.2,0.058764797449111936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,64,power_law_1.2,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,64,power_law_1.2,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,64,power_law_1.2,0.06901760101318359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,64,power_law_1.2,0.07065600156784058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,16,4,power_law_1.2,0.34754559993743894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,64,power_law_1.2,0.08089600205421447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,64,power_law_1.2,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,64,power_law_1.2,0.1798143982887268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,64,power_law_1.2,0.26972160339355467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,64,power_law_1.2,0.3274751901626587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,64,power_law_1.2,0.4671487808227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,64,power_law_1.2,0.5746496200561524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,64,power_law_1.2,0.9070591926574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,64,power_law_1.2,1.1882495880126953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,64,power_law_1.2,2.1426048278808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,64,power_law_1.2,2.839347267150879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,16,4,power_law_1.2,0.47800321578979493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,1,power_law_1.01,46.89448852539063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,4,power_law_1.2,1.4804991722106933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,1,1,power_law_1.01,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,1,1,power_law_1.01,0.44851198196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,1,1,power_law_1.01,0.8693759918212891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,1,1,power_law_1.01,1.2732288360595703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,1,1,power_law_1.01,1.7672191619873048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,1,1,power_law_1.01,2.86822395324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,1,1,power_law_1.01,3.0896064758300783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,1,1,power_law_1.01,3.1442943572998048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,1,1,power_law_1.01,3.194879913330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,1,1,power_law_1.01,3.2040958404541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,1,1,power_law_1.01,3.3107967376708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,1,1,power_law_1.01,3.3662975311279295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,1,1,power_law_1.01,3.4074302673339845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,1,1,power_law_1.01,3.44903678894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,1,1,power_law_1.01,3.520512008666992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,1,1,power_law_1.01,3.571712112426758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,16,4,power_law_1.2,0.6780928134918213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,1,1,power_law_1.01,3.657932662963867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,1,1,power_law_1.01,3.812966537475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,1,1,power_law_1.01,3.9192256927490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,1,1,power_law_1.01,4.313907241821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,1,1,power_law_1.01,4.757907104492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,1,power_law_1.01,58.6197021484375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,1,1,power_law_1.01,5.68463363647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,1,1,power_law_1.01,6.717030334472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,1,1,power_law_1.01,8.834233856201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,1,1,power_law_1.01,10.310860443115235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,1,1,power_law_1.01,14.431231689453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,1,1,power_law_1.01,18.663597106933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,16,4,power_law_1.2,1.0878975868225098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,1,power_law_1.01,70.69839477539062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,4,power_law_1.2,1.8687999725341797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,1,power_law_1.01,95.73478393554687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,16,4,power_law_1.2,1.4997504234313965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,16,4,power_law_1.2,2.0535167694091796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,1,power_law_1.01,119.91551513671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,8,16,power_law_1.01,0.053235197067260744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,8,16,power_law_1.01,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,8,16,power_law_1.01,0.22527999877929689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,8,16,power_law_1.01,0.21626880168914794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,8,16,power_law_1.01,0.22446079254150392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,8,16,power_law_1.01,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,8,16,power_law_1.01,0.10362880229949951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,8,16,power_law_1.01,0.15605759620666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,8,16,power_law_1.01,0.2002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,8,16,power_law_1.01,0.1896448016166687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,8,16,power_law_1.01,0.14725120067596437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,8,16,power_law_1.01,0.21094400882720948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,8,16,power_law_1.01,0.19763200283050536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,8,16,power_law_1.01,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,8,16,power_law_1.01,0.2342911958694458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,8,16,power_law_1.01,0.25128960609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,8,16,power_law_1.01,0.2574336051940918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,8,16,power_law_1.01,0.2861056089401245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,8,16,power_law_1.01,0.3201024055480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,8,16,power_law_1.01,0.3635200023651123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,8,16,power_law_1.01,0.4272128105163574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,8,16,power_law_1.01,0.5345280170440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,8,16,power_law_1.01,0.6658048152923584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,8,16,power_law_1.01,0.9797632217407226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,8,16,power_law_1.01,1.2986368179321288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,8,16,power_law_1.01,2.093670463562012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,8,16,power_law_1.01,2.850694465637207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,8,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,8,balanced,0.025941332181294758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,8,balanced,0.0264533335963885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,8,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,8,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,8,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,8,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,8,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,8,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,8,balanced,0.032085334261258446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,8,balanced,0.03259200106064478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,8,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,8,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,8,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,8,balanced,0.03839999934037527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,8,balanced,0.038912000755469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,8,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,8,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,8,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,8,balanced,0.09864532947540283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,8,balanced,0.13738666971524557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,8,balanced,0.24388267596562704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,8,balanced,0.3123199939727783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,8,balanced,0.4556800127029419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,8,balanced,0.6283946832021078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,8,balanced,1.0635840098063152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,8,balanced,1.4412800470987956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.3110527992248535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.5914624214172364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,1,power_law_1.01,1.1214847564697266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,1,power_law_1.01,1.8411520004272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,1,power_law_1.01,2.629631996154785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,1,power_law_1.01,4.200447845458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,1,power_law_1.01,4.496352005004883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,1,power_law_1.01,4.689920043945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,1,power_law_1.01,4.75074577331543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,1,power_law_1.01,4.791686248779297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,1,power_law_1.01,4.951654434204102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,1,power_law_1.01,5.034598541259766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,1,power_law_1.01,5.169356918334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,1,power_law_1.01,5.451769638061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,1,power_law_1.01,5.63322868347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,1,power_law_1.01,5.668864059448242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,1,power_law_1.01,5.741363143920898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,1,power_law_1.01,6.218956756591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,1,power_law_1.01,6.559321594238281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,1,power_law_1.01,6.954188537597656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,1,power_law_1.01,7.196057891845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,1,power_law_1.01,8.522124481201171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,1,power_law_1.01,9.304883575439453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,1,power_law_1.2,0.5111807823181153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,1,power_law_1.2,0.7753727912902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,1,power_law_1.2,0.7677760124206543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,1,power_law_1.2,1.6943103790283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,1,power_law_1.2,1.7741823196411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,1,power_law_1.01,11.997593688964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,1,power_law_1.2,1.7106943130493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,1,power_law_1.2,1.764352035522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,1,power_law_1.2,1.7764352798461913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,1,power_law_1.2,1.8139135360717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,1,power_law_1.2,1.824153518676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,1,power_law_1.2,1.9101696014404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,1,power_law_1.01,14.927667236328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,1,power_law_1.2,2.0307968139648436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,1,power_law_1.2,2.0305919647216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,1,power_law_1.2,2.076249694824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,1,power_law_1.2,2.2007808685302734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,1,power_law_1.2,2.2947839736938476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,1,power_law_1.01,20.677427673339842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,1,power_law_1.2,2.4543231964111327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,1,power_law_1.2,2.9196224212646484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,1,power_law_1.01,26.347314453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,1,power_law_1.2,3.337625503540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,1,power_law_1.2,4.158464050292968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,1,power_law_1.2,4.841471862792969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,1,power_law_1.2,6.403890991210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,1,power_law_1.2,8.383283233642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,16,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,16,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,16,balanced,0.02199466774861018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,16,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,16,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,16,balanced,0.02881066749493281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,16,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,16,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,16,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,16,balanced,0.02935466667016347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,16,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,16,balanced,0.03137599925200144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,16,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,16,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,16,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,16,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,16,balanced,0.06451199948787689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,16,balanced,0.08533333738644917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,16,balanced,0.09676800171534221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,16,balanced,0.1616213321685791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,16,balanced,0.19660800695419312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,1,power_law_1.2,11.671756744384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,16,balanced,0.27511467536290485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,16,balanced,0.3280213276545207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,16,balanced,0.5034666856129965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,16,balanced,0.6850399971008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,8,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,8,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,8,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,8,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,8,balanced,0.17066667477289835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,8,balanced,0.37033601601918537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,8,balanced,0.3717120091120402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,8,balanced,0.3614720106124878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,8,balanced,0.3633493185043335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,8,balanced,0.36420265833536786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,8,balanced,0.366592009862264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,8,balanced,0.3694933255513509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,8,balanced,0.37085866928100586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,8,balanced,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,8,balanced,0.3809279998143514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,8,balanced,0.3848533233006795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,8,balanced,0.3930453459421794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,8,balanced,0.40960001945495605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,8,balanced,0.4278613328933716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,8,balanced,0.4602880080540975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,8,balanced,0.4952746629714966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,8,balanced,0.553984006245931
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,8,balanced,0.6034773190816244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,8,balanced,0.7237973213195801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,8,balanced,0.882858673731486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,8,balanced,1.249621311823527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,8,balanced,1.6573440233866374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,1,power_law_1.2,15.878758239746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,1,power_law_1.2,22.427647399902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,1,balanced,0.21333332856496176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,1,balanced,0.42956801255544025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,1,balanced,0.8203946749369303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,1,balanced,1.4457173347473145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,1,balanced,2.8045600255330405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,1,balanced,4.105216026306152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,1,balanced,4.132863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,1,balanced,4.162218729654948
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,1,balanced,4.1855894724528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,1,balanced,4.210858662923177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,1,balanced,4.256405194600423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,1,balanced,4.306090672810872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,1,balanced,4.346368153889974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,1,balanced,4.4270931879679365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,1,balanced,4.507818539937337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,1,balanced,4.588693300882976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,1,balanced,4.753237406412761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,1,balanced,5.101738611857097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,1,balanced,5.428053538004558
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,1,balanced,5.83082644144694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,1,balanced,6.3929704030354815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,4,4,power_law_1.01,0.18165760040283202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,4,4,power_law_1.01,0.23695359230041504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,4,4,power_law_1.01,0.16179200410842895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,4,4,power_law_1.01,0.27381761074066163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,1,balanced,7.6641279856363935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,4,4,power_law_1.01,0.2795520067214966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,4,4,power_law_1.01,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,4,4,power_law_1.01,0.2885632038116455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,4,4,power_law_1.01,0.29184000492095946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,4,4,power_law_1.01,0.29224960803985595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,4,4,power_law_1.01,0.30126080513000486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,4,4,power_law_1.01,0.3112895965576172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,4,4,power_law_1.01,0.314572811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,1,balanced,9.183061599731445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,4,4,power_law_1.01,0.3235840082168579
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,4,4,power_law_1.01,0.36945281028747556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,4,4,power_law_1.01,0.3952640056610107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,4,4,power_law_1.01,0.4558847904205322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,4,4,power_law_1.01,0.4573184013366699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,1,balanced,12.312917073567709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,4,4,power_law_1.01,0.5500927925109863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,4,4,power_law_1.01,0.7331840038299561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,1,balanced,14.981632232666016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,4,4,power_law_1.01,0.9766847610473632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,1,balanced,21.296794891357422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,4,4,power_law_1.01,1.3172608375549317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,1,balanced,27.4431889851888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,4,4,power_law_1.01,1.820262336730957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,4,4,power_law_1.01,2.188083267211914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,1,power_law_1.2,28.239053344726564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,4,4,power_law_1.01,3.5778560638427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,4,4,power_law_1.01,4.135526275634765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,4,power_law_1.2,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,4,power_law_1.2,0.2871295928955078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,4,power_law_1.2,0.4249472141265869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,4,power_law_1.2,0.4923391819000244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,4,power_law_1.2,0.7350272178649903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,4,power_law_1.2,0.879206371307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,4,power_law_1.2,1.0217215538024902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,4,power_law_1.2,1.2752896308898927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,2,2,power_law_1.2,0.5578752040863038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,2,2,power_law_1.2,0.8241151809692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,4,power_law_1.2,1.3529088020324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,2,2,power_law_1.2,1.277952003479004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,4,power_law_1.2,1.386291217803955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,2,2,power_law_1.2,1.7770496368408204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,4,power_law_1.2,1.2263423919677734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,4,power_law_1.2,1.3451264381408692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,4,power_law_1.2,1.195622444152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,2,2,power_law_1.2,1.6977920532226562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,4,power_law_1.2,1.2511232376098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,2,2,power_law_1.2,1.7944576263427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,4,power_law_1.2,1.3137920379638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,2,2,power_law_1.2,1.8165760040283203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,4,power_law_1.2,1.3125375747680663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,2,2,power_law_1.2,2.178867149353027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,4,power_law_1.2,1.4809087753295898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,2,2,power_law_1.2,2.4014848709106444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,4,power_law_1.2,1.5474687576293946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,2,2,power_law_1.2,2.397593688964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,4,power_law_1.2,1.6166912078857423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,2,2,power_law_1.2,2.28720645904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,4,power_law_1.2,1.866534423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,2,2,power_law_1.2,2.4559616088867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,4,power_law_1.2,1.987788772583008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,2,2,power_law_1.2,2.630860710144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,4,power_law_1.2,2.3123968124389647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,2,2,power_law_1.2,3.015065574645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,4,power_law_1.2,2.7639808654785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,2,2,power_law_1.2,3.240755081176758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,4,power_law_1.2,3.7711872100830077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,4,4,power_law_1.01,5.4411262512207035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,2,2,power_law_1.2,3.606732940673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,4,power_law_1.2,4.271680068969727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,2,2,power_law_1.2,4.4269569396972654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,4,power_law_1.2,6.115110397338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,2,2,power_law_1.2,5.3346305847167965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,4,power_law_1.2,7.033241271972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,2,2,power_law_1.2,6.4538627624511715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,2,2,power_law_1.2,7.879673767089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,4,4,power_law_1.01,7.990681457519531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,2,2,power_law_1.2,8.89917449951172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,2,2,power_law_1.2,12.081766510009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,128,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,128,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,128,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,128,power_law_1.01,0.05568640232086182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,128,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,128,power_law_1.01,0.057548797130584715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,128,power_law_1.01,0.05816320180892944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,128,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,128,power_law_1.01,0.06079999804496765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,128,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,128,power_law_1.01,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,128,power_law_1.01,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,128,power_law_1.01,0.0694271981716156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,128,power_law_1.01,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,128,power_law_1.01,0.08294399976730346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,128,power_law_1.01,0.09154559969902039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,128,power_law_1.01,0.10649600028991699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,128,power_law_1.01,0.1615872025489807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,128,power_law_1.01,0.22323200702667237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,128,power_law_1.01,0.30801920890808104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,128,power_law_1.01,0.3579904079437256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,128,power_law_1.01,0.5281792163848877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,128,power_law_1.01,0.7741439819335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,128,power_law_1.01,1.1638784408569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,128,power_law_1.01,1.56692476272583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,128,power_law_1.01,2.371583938598633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,128,power_law_1.01,2.917580795288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,2,2,power_law_1.2,14.313063049316407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,2,2,power_law_1.2,18.898739624023438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,16,8,power_law_1.2,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,16,8,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,16,8,power_law_1.2,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,16,8,power_law_1.2,0.06264320015907288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,16,8,power_law_1.2,0.08847360014915466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,16,8,power_law_1.2,0.14970879554748534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,16,8,power_law_1.2,0.16773120164871216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,16,8,power_law_1.2,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,16,8,power_law_1.2,0.14725120067596437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,16,8,power_law_1.2,0.16383999586105347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,16,8,power_law_1.2,0.15400960445404052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,16,8,power_law_1.2,0.157043194770813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,16,8,power_law_1.2,0.17838079929351808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,16,8,power_law_1.2,0.21401600837707518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,16,8,power_law_1.2,0.22917120456695556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,16,8,power_law_1.2,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,16,8,power_law_1.2,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,16,8,power_law_1.2,0.3000319957733154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,16,8,power_law_1.2,0.32972800731658936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,128,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,128,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,16,8,power_law_1.2,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,128,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,16,8,power_law_1.2,0.46611838340759276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,128,power_law_1.2,0.03031040132045746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,16,8,power_law_1.2,0.6072319984436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,128,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,128,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,128,power_law_1.2,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,16,8,power_law_1.2,0.8720383644104004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,128,power_law_1.2,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,128,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,128,power_law_1.2,0.03256320059299469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,16,8,power_law_1.2,1.326899242401123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,128,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,128,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,128,power_law_1.2,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,128,power_law_1.2,0.036447998881340024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,16,8,power_law_1.2,1.847091293334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,128,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,128,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,128,power_law_1.2,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,128,power_law_1.2,0.06348800063133239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,128,power_law_1.2,0.08028159737586975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,16,8,power_law_1.2,2.7623424530029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,128,power_law_1.2,0.12042239904403687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,128,power_law_1.2,0.17018879652023317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,128,power_law_1.2,0.32522239685058596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,16,8,power_law_1.2,3.835481643676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,128,power_law_1.2,0.4444159984588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,2,2,power_law_1.2,22.583705139160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,128,power_law_1.2,0.6948863983154296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,128,power_law_1.2,0.9168895721435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,2,2,power_law_1.2,28.404327392578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,128,power_law_1.2,1.6109567642211915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,1,2,balanced,0.2577066620190938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,1,2,balanced,0.45431466897328693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,1,2,balanced,0.8767146269480387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,1,2,balanced,1.718272050221761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,1,2,balanced,3.397973378499349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,1,2,balanced,3.406165440877279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,1,2,balanced,3.4129918416341147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,1,2,balanced,3.42083740234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,1,2,balanced,3.4297173817952475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,1,2,balanced,3.4375413258870444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,1,2,balanced,3.4578774770100913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,1,2,balanced,3.4870611826578775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,1,2,balanced,3.5124905904134116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,1,2,balanced,3.5590826670328775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,1,2,balanced,3.6573867797851562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,1,2,balanced,3.6826454798380532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,1,2,balanced,3.731781323750814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,128,power_law_1.2,2.1399551391601563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,1,2,balanced,3.813546816507975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,1,2,balanced,4.038997332255046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,1,2,balanced,4.0635732014973955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,1,2,balanced,4.120917320251465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,1,2,balanced,4.536490758260091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,1,2,balanced,4.916223843892415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,1,2,balanced,6.17898686726888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,1,2,balanced,7.4496002197265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,2,2,power_law_1.2,36.557003784179685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,1,2,balanced,10.727755228678385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,1,2,balanced,14.073173522949219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,2,power_law_1.01,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,2,power_law_1.01,0.025798401236534117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,2,power_law_1.01,0.02805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,2,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,2,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,2,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,2,power_law_1.01,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,2,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,2,power_law_1.01,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,2,power_law_1.01,0.039904001355171206
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,2,power_law_1.01,0.04154880046844482
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,2,power_law_1.01,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,2,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,2,power_law_1.01,0.05117440223693848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,2,power_law_1.01,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,1,power_law_1.01,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,2,power_law_1.01,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,1,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,2,power_law_1.01,0.07598080039024353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,1,power_law_1.01,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,2,power_law_1.01,0.11038080453872681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,1,power_law_1.01,0.16568319797515868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,2,power_law_1.01,0.17489919662475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,1,power_law_1.01,0.25026559829711914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,2,power_law_1.01,0.2336575984954834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,1,power_law_1.01,0.38727679252624514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,2,power_law_1.01,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,1,power_law_1.01,0.41000962257385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,2,power_law_1.01,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,1,power_law_1.01,0.4282368183135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,1,power_law_1.01,0.4395008087158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,2,power_law_1.01,0.4902912139892578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,1,power_law_1.01,0.4442111968994141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,2,power_law_1.01,0.7780352115631104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,1,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,1,power_law_1.01,0.47759361267089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,2,power_law_1.01,1.0522432327270508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,1,power_law_1.01,0.49745922088623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,1,power_law_1.01,0.5068799972534179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,2,power_law_1.01,1.6744447708129884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,1,power_law_1.01,0.5255167961120606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,1,power_law_1.01,0.5599232196807862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,1,power_law_1.01,0.610918378829956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,2,power_law_1.01,2.088345527648926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,1,power_law_1.01,0.66211838722229
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,1,power_law_1.01,0.7434239864349366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,1,power_law_1.01,0.9422783851623535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,1,power_law_1.01,1.1606016159057617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,1,power_law_1.01,1.5818752288818358
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,1,power_law_1.01,1.962393569946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,1,power_law_1.01,2.735296058654785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,1,power_law_1.01,3.560038375854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,1,power_law_1.01,5.30780143737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,1,power_law_1.01,7.071743774414062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,8,1,power_law_1.01,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,8,1,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,8,1,power_law_1.01,0.11816960573196411
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,8,1,power_law_1.01,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,8,1,power_law_1.01,0.2707263946533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,8,1,power_law_1.01,0.278931188583374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,8,1,power_law_1.01,0.28384640216827395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,8,1,power_law_1.01,0.2852864027023315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,8,1,power_law_1.01,0.28774399757385255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,8,1,power_law_1.01,0.28282880783081055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,8,1,power_law_1.01,0.30023679733276365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,8,1,power_law_1.01,0.3014656066894531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,8,1,power_law_1.01,0.30023679733276365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,8,1,power_law_1.01,0.29511680603027346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,8,1,power_law_1.01,0.3078144073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,8,1,power_law_1.01,0.3135488033294678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,8,1,power_law_1.01,0.33075199127197263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,8,1,power_law_1.01,0.3825664043426514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,8,1,power_law_1.01,0.45342721939086916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,8,1,power_law_1.01,0.5855231761932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,8,1,power_law_1.01,0.6807551860809327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,8,1,power_law_1.01,1.0061823844909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,8,1,power_law_1.01,1.274662399291992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,1,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,1,power_law_1.2,0.18818559646606445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,1,power_law_1.2,0.3477504014968872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,1,power_law_1.2,0.6062079906463623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,1,power_law_1.2,0.8859647750854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,8,1,power_law_1.01,1.946009635925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,1,power_law_1.2,1.2519424438476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,1,power_law_1.2,1.7897472381591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,1,power_law_1.2,1.9494911193847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,1,power_law_1.2,1.9912448883056642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,1,power_law_1.2,2.089779281616211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,1,power_law_1.2,2.1495807647705076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,1,power_law_1.2,2.277561569213867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,1,power_law_1.2,2.29355525970459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,1,power_law_1.2,2.3773183822631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,1,power_law_1.2,2.4229888916015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,1,power_law_1.2,2.4098432540893553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,1,power_law_1.2,2.6609344482421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,1,power_law_1.2,2.7860992431640623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,8,1,power_law_1.01,2.6193920135498048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,1,power_law_1.2,2.9212671279907227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,1,power_law_1.2,3.1688703536987304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,1,power_law_1.2,3.3279998779296873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,1,power_law_1.2,3.8909950256347656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,1,power_law_1.2,4.348908615112305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,1,power_law_1.2,5.5119873046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,1,power_law_1.2,6.372966384887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,1,power_law_1.2,8.665293121337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,1,power_law_1.2,10.839839935302734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,8,1,power_law_1.01,4.037017440795898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,32,1,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,32,1,power_law_1.01,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,32,1,power_law_1.01,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,32,1,power_law_1.01,0.12369920015335083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,32,1,power_law_1.01,0.264192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,32,1,power_law_1.01,0.3713023900985718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,32,1,power_law_1.01,0.43765759468078613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,32,1,power_law_1.01,0.5591040134429932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,32,1,power_law_1.01,0.5951488018035889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,32,1,power_law_1.01,0.6219776153564454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,32,1,power_law_1.01,0.6459199905395507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,32,1,power_law_1.01,0.685260820388794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,32,1,power_law_1.01,0.7127039909362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,32,1,power_law_1.01,0.7970816135406494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,32,1,power_law_1.01,0.8113856315612793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,32,1,power_law_1.01,0.8556544303894043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,32,1,power_law_1.01,0.9252863883972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,32,1,power_law_1.01,1.093836784362793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,32,1,power_law_1.01,1.2484607696533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,8,1,power_law_1.01,5.331763076782226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,32,1,power_law_1.01,1.618124771118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,32,1,power_law_1.01,1.9519487380981446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,32,1,power_law_1.01,2.6382144927978515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,32,1,power_law_1.01,3.313228988647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,32,1,power_law_1.01,4.719001770019531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,32,1,power_law_1.01,6.171648025512695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,32,1,power_law_1.01,9.18116455078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,32,1,power_law_1.01,12.217549133300782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,64,power_law_1.01,0.4607999801635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,64,power_law_1.01,0.41390080451965333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,64,power_law_1.01,0.4128767967224121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,64,power_law_1.01,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,64,power_law_1.01,0.38932480812072756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,64,power_law_1.01,0.34037759304046633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,64,power_law_1.01,0.3299328088760376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,64,power_law_1.01,0.3956736087799072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,64,power_law_1.01,0.397107195854187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,64,power_law_1.01,0.37150719165802004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,64,power_law_1.01,0.4005887985229492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,64,power_law_1.01,0.3772416114807129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,1,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,1,balanced,0.2532693346341451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,64,power_law_1.01,0.37908480167388914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,1,balanced,0.46694401899973553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,1,balanced,0.4657493432362874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,1,balanced,0.4679679870605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,64,power_law_1.01,0.4233215808868408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,1,balanced,0.47257598241170246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,1,balanced,0.475818673769633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,64,power_law_1.01,0.41984000205993655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,1,balanced,0.4792319933573405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,1,balanced,0.4851786692937215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,64,power_law_1.01,0.40712318420410154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,1,balanced,0.48742401599884033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,1,balanced,0.4939093192418416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,64,power_law_1.01,0.4206592082977295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,1,balanced,0.5099519888559977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,1,balanced,0.5157546599706014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,64,power_law_1.01,0.46981120109558105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,1,balanced,0.5169493357340494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,1,balanced,0.5435733397801717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,1,balanced,0.5630186796188354
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,64,power_law_1.01,0.4980735778808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,1,balanced,0.5468159914016724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,1,balanced,0.6217386722564697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,64,power_law_1.01,0.5720064163208007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,1,balanced,0.6613333225250244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,1,balanced,0.823637326558431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,64,power_law_1.01,0.6547455787658691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,1,balanced,1.047381321589152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,64,power_law_1.01,0.7747583866119385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,1,balanced,1.5655253728230794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,1,balanced,2.1017600695292153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,64,power_law_1.01,0.8474623680114746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,1,balanced,3.1754239400227866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,64,power_law_1.01,1.3445119857788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,64,power_law_1.01,1.7483776092529297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,1,balanced,4.210858662923177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,64,power_law_1.01,2.609766387939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,1,balanced,6.345898946126302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,64,power_law_1.01,3.2131072998046877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,1,balanced,8.385706583658854
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,8,balanced,0.5167786677678426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,8,balanced,0.4572106599807739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,8,balanced,0.4614826838175456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,8,balanced,0.4681386550267537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,8,balanced,0.4643839995066325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,8,balanced,0.46745598316192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,8,balanced,0.47035733858744305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,8,balanced,0.4720640182495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,8,balanced,0.47411199410756427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,8,balanced,0.4775253136952718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,8,balanced,0.4819626808166504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,8,balanced,0.4858880043029785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,8,balanced,0.48742401599884033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,8,balanced,0.5130240122477213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,8,balanced,0.5521066586176554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,8,balanced,0.5599573453267416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,8,balanced,0.5478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,8,balanced,0.9321813583374023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,8,balanced,0.9285973707834879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,8,balanced,1.3487787246704102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,8,balanced,1.733290672302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,8,balanced,2.553343931833903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,8,balanced,3.2742398579915366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,8,balanced,4.6484479904174805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,8,balanced,5.835093180338542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,8,balanced,7.88650639851888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,8,balanced,9.620138804117838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,4,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,4,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,4,balanced,0.17254400253295898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,4,balanced,0.3964586655298869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,4,balanced,0.7096319993336996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,4,balanced,0.9424213568369547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,4,balanced,0.9456640084584554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,4,balanced,0.9475413163503011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,4,balanced,0.9492479960123698
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,4,balanced,0.9523200194040934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,4,balanced,0.9564159711201986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,4,balanced,0.9610239664713541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,4,balanced,0.964949369430542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,4,balanced,0.9712639649709066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,4,balanced,0.9794399738311768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,4,balanced,0.9861120382944742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,4,balanced,0.9975466728210449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,4,balanced,1.0105173587799072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,4,balanced,1.0284372965494792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,4,balanced,1.0516479810078938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,4,balanced,1.0915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,4,balanced,1.2101973692576091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,4,balanced,1.263445297876994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,4,balanced,1.5349706013997395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,4,balanced,1.6851627031962078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,4,balanced,2.3181653022766113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,4,balanced,2.8629334767659507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,1,8,power_law_1.2,0.9066495895385742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,1,8,power_law_1.2,0.9027584075927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,1,8,power_law_1.2,0.9011199951171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,1,8,power_law_1.2,0.9039872169494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,1,8,power_law_1.2,0.9064448356628418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,1,8,power_law_1.2,0.9312255859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,1,8,power_law_1.2,1.4024703979492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,1,8,power_law_1.2,1.5431679725646972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,1,8,power_law_1.2,1.8202367782592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,1,8,power_law_1.2,2.087526321411133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,1,32,balanced,0.022341333329677582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,1,32,balanced,0.02165866643190384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,1,32,balanced,0.021669333179791767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,1,32,balanced,0.022015998760859173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,1,32,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,1,32,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,1,32,balanced,0.0240639994541804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,1,32,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,1,32,balanced,0.024234667420387268
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,1,8,power_law_1.2,1.7805183410644532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,1,32,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,1,32,balanced,0.025253333151340485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,1,32,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,1,32,balanced,0.025744001070658367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,1,32,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,1,32,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,1,32,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,1,32,balanced,0.031888000667095184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,1,32,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,1,32,balanced,0.03822933385769526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,1,32,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,1,32,balanced,0.05563733478387197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,1,8,power_law_1.2,2.254233551025391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,1,32,balanced,0.08992000420888265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,1,32,balanced,0.0962559978167216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,1,32,balanced,0.1418239971001943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,1,32,balanced,0.16571733355522156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,1,32,balanced,0.3027626673380534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,1,8,power_law_1.2,2.3824384689331053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,1,32,balanced,0.39560532569885254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,1,8,power_law_1.2,2.8180479049682616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,1,8,power_law_1.2,3.704217529296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,1,8,power_law_1.2,3.9639041900634764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,1,8,power_law_1.2,4.899430465698242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,1,8,power_law_1.2,7.878246307373047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,1,8,power_law_1.2,10.774527740478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,1,8,power_law_1.2,13.774234008789062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,32,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,32,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,32,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,32,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,32,balanced,0.06195199986298879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,32,balanced,0.20821332931518555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,32,balanced,0.20889600118001303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,32,balanced,0.21094399690628052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,32,balanced,0.21230934063593546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,32,balanced,0.21384533246358237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,32,balanced,0.21691733598709106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,32,balanced,0.21913599967956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,32,balanced,0.2208426594734192
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,32,balanced,0.22562134265899658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,32,balanced,0.2302293380101522
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,32,balanced,0.23637332518895468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,32,balanced,0.24438399076461792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,32,balanced,0.2650453249613444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,32,balanced,0.2870560089747111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,32,balanced,0.32443199555079144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,32,balanced,0.35703468322753906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,32,balanced,0.42239999771118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,32,balanced,0.482474684715271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,32,balanced,0.6546719868977865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,32,balanced,0.7975253264109293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,1,8,power_law_1.2,18.3552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,32,balanced,1.241429328918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,32,balanced,1.664511998494466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,1,8,power_law_1.2,22.41126403808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,1,8,power_law_1.2,26.476947021484374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,16,power_law_1.01,0.4374527931213379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,16,power_law_1.01,0.5574656009674073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,16,power_law_1.01,0.5353472232818604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,16,power_law_1.01,0.5494783878326416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,16,power_law_1.01,0.5550079822540284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,16,power_law_1.01,0.51179518699646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,16,power_law_1.01,0.4808640003204346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,16,power_law_1.01,0.5081088066101074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,16,power_law_1.01,0.48046078681945803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,16,power_law_1.01,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,16,power_law_1.01,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,16,power_law_1.01,0.5335040092468262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,16,power_law_1.01,0.5062655925750732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,16,power_law_1.01,0.5361663818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,16,power_law_1.01,0.5478400230407715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,16,power_law_1.01,0.577126407623291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,16,power_law_1.01,0.580403184890747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,16,power_law_1.01,0.6338560104370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,16,power_law_1.01,0.6746111869812011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,16,power_law_1.01,0.777184009552002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,16,power_law_1.01,0.8460288047790527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,16,power_law_1.01,1.06496000289917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,16,power_law_1.01,1.1835136413574219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,16,power_law_1.01,1.7897472381591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,16,power_law_1.01,2.2167552947998046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,16,power_law_1.01,3.2307201385498048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,1,8,power_law_1.2,34.50613708496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,16,power_law_1.01,4.278476715087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,8,power_law_1.01,0.6051839828491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,8,power_law_1.01,1.0711039543151855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,8,power_law_1.01,1.4872575759887696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,8,power_law_1.01,1.5839232444763183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,8,power_law_1.01,1.4536704063415526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,4,balanced,0.021162666380405426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,4,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,4,balanced,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,4,balanced,0.024405332903067272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,4,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,4,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,4,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,4,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,8,power_law_1.01,1.6283647537231445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,4,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,4,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,4,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,4,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,4,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,4,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,4,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,4,balanced,0.04164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,4,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,4,balanced,0.056661332647005715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,8,power_law_1.01,1.8259647369384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,4,balanced,0.06980266670385997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,4,balanced,0.11366400122642517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,4,balanced,0.17493333419164023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,4,balanced,0.21964800357818604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,4,balanced,0.23688532908757529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,8,power_law_1.01,1.8049024581909179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,4,balanced,0.3916693528493245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,4,balanced,0.5806080102920532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,8,power_law_1.01,1.8325504302978515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,4,balanced,0.9970346291859945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,8,power_law_1.01,1.7002496719360352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,4,balanced,1.3388800621032715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,8,power_law_1.01,1.7135616302490235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,8,power_law_1.01,1.8687936782836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,8,power_law_1.01,1.7881088256835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,8,power_law_1.01,1.9756799697875977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,8,power_law_1.01,1.9494911193847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,8,power_law_1.01,1.9597312927246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,8,power_law_1.01,1.9720191955566406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,8,power_law_1.01,2.317888069152832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,8,power_law_1.01,2.1608255386352537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,8,power_law_1.01,2.448761558532715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,8,power_law_1.01,2.6710016250610353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,8,power_law_1.01,2.976358413696289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,8,power_law_1.01,3.4791423797607424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,32,power_law_1.01,0.6012928009033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,32,power_law_1.01,0.7909376144409179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,8,power_law_1.01,4.698112106323242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,32,power_law_1.01,0.7880703926086425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,32,power_law_1.01,0.7882751941680908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,8,power_law_1.01,4.9934337615966795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,32,power_law_1.01,0.7888895988464355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,32,power_law_1.01,0.6846464157104493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,32,power_law_1.01,0.6727680206298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,32,power_law_1.01,0.7723008155822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,8,power_law_1.01,6.903193664550781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,32,power_law_1.01,0.7315455913543701
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,32,power_law_1.01,0.7569407939910888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,32,power_law_1.01,0.7006207942962647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,32,power_law_1.01,0.7221248149871826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,8,power_law_1.01,9.538764953613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,32,power_law_1.01,0.6918144226074219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,32,power_law_1.01,0.7706624031066894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,32,power_law_1.01,0.7665664196014405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,32,power_law_1.01,0.7317503929138184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,32,power_law_1.01,0.7516160011291504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,32,power_law_1.01,0.8730624198913575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,32,power_law_1.01,0.8390656471252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,32,power_law_1.01,0.9439231872558593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,32,power_law_1.01,0.9945088386535644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,1,8,power_law_1.2,39.58476867675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,32,power_law_1.01,1.2130304336547852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,32,power_law_1.01,1.3932543754577638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,32,power_law_1.01,1.962803268432617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,32,power_law_1.01,2.5049087524414064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,32,power_law_1.01,3.384320068359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,32,power_law_1.01,4.62663688659668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,16,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,16,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,16,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,16,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,16,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,16,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,16,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,16,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,16,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,16,power_law_1.2,0.03091199994087219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,16,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,16,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,16,power_law_1.2,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,16,power_law_1.2,0.04688639938831329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,16,power_law_1.2,0.04689919948577881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,16,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,16,power_law_1.2,0.06533120274543762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,16,power_law_1.2,0.0741312026977539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,16,power_law_1.2,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,16,power_law_1.2,0.11284480094909669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,16,power_law_1.2,0.21811199188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,16,power_law_1.2,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,16,power_law_1.2,0.41656317710876467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,16,power_law_1.2,0.5345151901245118
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,16,power_law_1.2,0.8607744216918946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,16,power_law_1.2,1.2677120208740233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,1,8,power_law_1.2,50.95628662109375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,1,8,power_law_1.2,64.94187622070312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,4,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,4,balanced,0.28413333495457965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,4,balanced,0.5531306664148966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,4,balanced,1.0615466435750325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,4,balanced,2.0273280143737793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,4,balanced,4.138154665629069
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,4,balanced,4.150783856709798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,4,balanced,3.988821347554525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,4,balanced,3.9983787536621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,4,balanced,4.006058692932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,4,balanced,4.021077473958333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,4,balanced,4.0367787679036455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,4,balanced,4.0478560129801435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,4,balanced,4.073301315307617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,4,balanced,4.105898539225261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,4,balanced,4.126207987467448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,4,balanced,4.167999903361003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,4,balanced,4.24891726175944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,4,balanced,4.332031885782878
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,4,balanced,4.479488054911296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,4,balanced,4.646229426066081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,4,balanced,5.058901468912761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,4,balanced,5.257216135660808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,4,balanced,5.706410725911458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,4,balanced,6.469120025634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,4,balanced,8.482133229573568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,4,balanced,10.6878293355306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,2,128,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,2,128,balanced,0.053077335158983864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,2,128,balanced,0.05323733389377594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,2,128,balanced,0.06724266707897186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,2,128,balanced,0.053247998158137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,2,128,balanced,0.056320001681645714
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,2,128,balanced,0.05734399954477946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,2,128,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,2,128,balanced,0.05836800237496694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,2,128,balanced,0.06382933259010315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,2,128,balanced,0.05922133227189382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,2,128,balanced,0.06604800124963124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,2,128,balanced,0.06229333579540253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,2,128,balanced,0.06809600194295247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,2,128,balanced,0.07150933146476746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,2,128,balanced,0.07236266632874806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,2,128,balanced,0.0773119976123174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,2,128,balanced,0.1088853379090627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,2,128,balanced,0.1430186629295349
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,2,128,balanced,0.1904639999071757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,2,128,balanced,0.21384533246358237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,2,128,balanced,0.253440002600352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,2,128,balanced,0.3092479904492696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,2,128,balanced,0.42393600940704346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,2,128,balanced,0.5183146794637045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,2,128,balanced,0.7205546696980795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,2,128,balanced,0.942080020904541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,128,power_law_1.01,0.2541568040847778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,128,power_law_1.01,0.22915201187133788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,128,power_law_1.01,0.22855679988861083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,128,power_law_1.01,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,128,power_law_1.01,0.23057279586791993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,128,power_law_1.01,0.19804160594940184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,128,power_law_1.01,0.20087039470672607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,128,power_law_1.01,0.235315203666687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,128,power_law_1.01,0.23592960834503174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,128,power_law_1.01,0.23756160736083984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,128,power_law_1.01,0.24204161167144775
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,128,power_law_1.01,0.2451456069946289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,128,power_law_1.01,0.2471935987472534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,128,power_law_1.01,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,128,power_law_1.01,0.2396159887313843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,128,power_law_1.01,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,128,power_law_1.01,0.2795520067214966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,128,power_law_1.01,0.3151871919631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,128,power_law_1.01,0.32071681022644044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,128,power_law_1.01,0.39813120365142823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,128,power_law_1.01,0.4444159984588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,128,power_law_1.01,0.6037312030792237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,128,power_law_1.01,0.7555071830749511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,128,power_law_1.01,1.1722432136535645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,128,power_law_1.01,1.6207872390747071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,128,power_law_1.01,2.4631296157836915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,128,power_law_1.01,3.1022975921630858
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,4,16,power_law_1.2,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,4,16,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,4,16,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,4,16,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,4,16,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,4,16,power_law_1.2,0.03501439988613129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,4,16,power_law_1.2,0.03583360016345978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,4,16,power_law_1.2,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,128,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,4,16,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,128,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,4,16,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,4,16,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,128,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,4,16,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,128,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,4,16,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,4,16,power_law_1.2,0.0536575973033905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,128,power_law_1.01,0.034815999865531924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,4,16,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,128,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,4,16,power_law_1.2,0.06963199973106385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,4,16,power_law_1.2,0.08622080087661743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,128,power_law_1.01,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,128,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,4,16,power_law_1.2,0.11079679727554322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,128,power_law_1.01,0.03706879913806915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,4,16,power_law_1.2,0.1521664023399353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,4,16,power_law_1.2,0.23019518852233886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,4,16,power_law_1.2,0.2850816011428833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,4,16,power_law_1.2,0.39628798961639405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,128,power_law_1.01,0.037273600697517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,128,power_law_1.01,0.038073599338531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,128,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,128,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,128,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,128,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,128,power_law_1.01,0.04503040015697479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,128,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,128,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,128,power_law_1.01,0.06775680184364319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,4,16,power_law_1.2,0.5191679954528808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,128,power_law_1.01,0.08478720188140869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,128,power_law_1.01,0.10936319828033447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,128,power_law_1.01,0.14909440279006958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,128,power_law_1.01,0.1755136013031006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,128,power_law_1.01,0.34856960773468015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,128,power_law_1.01,0.45854721069335935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,128,power_law_1.01,0.6881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,128,power_law_1.01,0.963379192352295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,4,16,power_law_1.2,0.923033618927002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,4,16,power_law_1.2,1.3737919807434082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,8,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,8,power_law_1.01,0.04320639967918396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,8,power_law_1.01,0.04298880100250244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,8,power_law_1.01,0.04524799883365631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,8,power_law_1.01,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,8,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,8,power_law_1.01,0.045875200629234315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,8,power_law_1.01,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,8,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,8,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,8,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,8,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,8,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,8,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,8,power_law_1.01,0.05857279896736145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,8,power_law_1.01,0.06389759778976441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,8,power_law_1.01,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,8,power_law_1.01,0.08744959831237793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,8,power_law_1.01,0.13824000358581542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,8,power_law_1.01,0.17776639461517335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,8,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,8,power_law_1.01,0.3704832077026367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,8,power_law_1.01,0.522649621963501
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,8,power_law_1.01,0.7610367774963379
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,4,16,power_law_1.2,1.8329599380493165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,8,power_law_1.01,1.172480010986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,8,power_law_1.01,1.6132095336914063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,8,power_law_1.2,0.3463167905807495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,8,power_law_1.2,0.3540992021560669
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,8,power_law_1.2,0.4986879825592041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,8,power_law_1.2,0.5042175769805908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,8,power_law_1.2,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,8,power_law_1.2,0.6236159801483154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,8,power_law_1.2,0.6262784004211426
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,8,power_law_1.2,0.6344704151153564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,8,power_law_1.2,0.6393856048583985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,8,power_law_1.2,0.6813695907592774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,8,power_law_1.2,0.6948736190795899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,8,power_law_1.2,0.664358377456665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,8,power_law_1.2,0.7186431884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,8,power_law_1.2,0.6957056045532226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,8,power_law_1.2,0.7573503971099853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,8,power_law_1.2,0.7729152202606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,8,power_law_1.2,0.7962624073028565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,8,power_law_1.2,0.8366080284118652
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,8,power_law_1.2,0.901734447479248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,8,power_law_1.2,0.9904128074645996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,8,power_law_1.2,1.2210176467895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,8,power_law_1.2,1.602764892578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,8,power_law_1.2,2.028134346008301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,8,power_law_1.2,3.059712028503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,8,power_law_1.2,3.3511425018310548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,8,power_law_1.2,5.087231826782227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,8,power_law_1.2,6.933094024658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,4,16,power_law_1.2,2.689228820800781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,16,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,16,balanced,0.025770666698614757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,16,balanced,0.0266239990790685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,16,balanced,0.026789332429567974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,16,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,16,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,16,balanced,0.028832000990708668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,16,balanced,0.02916266769170761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,16,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,16,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,16,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,16,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,16,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,16,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,16,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,16,balanced,0.04181333382924398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,16,balanced,0.04539733131726583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,16,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,16,balanced,0.06348800162474315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,16,balanced,0.13567999998728433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,16,balanced,0.2249386707941691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,16,balanced,0.3278506596883138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,16,balanced,0.4437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,16,balanced,0.7009173234303793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,16,balanced,1.0007893244425456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,32,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,32,power_law_1.2,0.02271360009908676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,32,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,32,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,32,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,32,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,32,power_law_1.2,0.02414720058441162
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,32,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,32,power_law_1.2,0.024166400730609893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,32,power_law_1.2,0.024985599517822265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,32,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,32,power_law_1.2,0.025804799795150758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,32,power_law_1.2,0.027238398790359497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,32,power_law_1.2,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,32,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,32,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,32,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,32,power_law_1.2,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,32,power_law_1.2,0.0686016023159027
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,32,power_law_1.2,0.07904000282287597
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,32,power_law_1.2,0.10895359516143799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,32,power_law_1.2,0.12288000583648681
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,32,power_law_1.2,0.2781183958053589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,32,power_law_1.2,0.34344959259033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,32,power_law_1.2,0.5136191844940186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,32,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,32,balanced,0.05751466751098633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,32,balanced,0.0576853354771932
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,32,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,32,balanced,0.5486933390299479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,32,balanced,1.056938648223877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,32,balanced,1.0598399639129639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,32,balanced,1.0513066450754802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,32,balanced,1.0524906317392986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,32,balanced,1.0547093550364177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,32,balanced,1.0579626560211182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,32,balanced,1.0586453278859456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,32,balanced,1.0615466435750325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,32,balanced,1.068885326385498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,32,balanced,1.0736640294392903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,32,balanced,1.0803199609120686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,32,balanced,1.0885120232899983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,32,balanced,1.126912037531535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,32,balanced,1.1482453346252441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,32,balanced,1.173845370610555
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,32,balanced,1.2115626335144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,32,balanced,1.4344533284505208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,32,balanced,1.4861653645833333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,32,balanced,1.7829546928405762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,32,balanced,1.951914628346761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,32,balanced,2.422954718271891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,32,balanced,2.9538987477620444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,32,power_law_1.2,0.7874559879302978
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.09031680226325989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.20295679569244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.22527999877929689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.46632962226867675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.4624320030212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.48967680931091306
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.49500160217285155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.49254398345947265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.4894720077514648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.4880383968353271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.4958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.5130239963531494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.5337088108062744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.5513216018676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.5484543800354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.6119423866271972
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.7159808158874512
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.7774208068847657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.9719807624816894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,16,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,16,power_law_1.01,0.052019202709198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,16,power_law_1.01,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,16,power_law_1.01,0.048127999901771544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,16,power_law_1.01,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,16,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,16,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,16,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,16,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,16,power_law_1.01,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,1,power_law_1.2,1.2097536087036134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,16,power_law_1.01,0.04564479887485504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,16,power_law_1.01,0.0477183997631073
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,16,power_law_1.01,0.052223998308181765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,16,power_law_1.01,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,16,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,16,power_law_1.01,0.07352319955825806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,16,power_law_1.01,0.08724480271339416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,16,power_law_1.01,0.1112064003944397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,16,power_law_1.01,0.1533951997756958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,16,power_law_1.01,0.24677760601043702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,16,power_law_1.01,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,16,power_law_1.01,0.424345588684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,16,power_law_1.01,0.6129663944244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,16,power_law_1.01,0.9297920227050781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,16,power_law_1.01,1.20381441116333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,1,power_law_1.2,1.6994047164916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,8,power_law_1.2,0.43376641273498534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,8,power_law_1.2,0.5257215976715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,8,power_law_1.2,0.6637567996978759
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,8,power_law_1.2,0.7966527938842773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,8,power_law_1.2,0.9783295631408692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,8,power_law_1.2,0.9703424453735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,8,power_law_1.2,0.9701375961303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,8,power_law_1.2,0.93306884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,8,power_law_1.2,0.9394047737121582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,8,power_law_1.2,0.9871359825134277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,8,power_law_1.2,0.994099235534668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,8,power_law_1.2,1.0033151626586914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,8,power_law_1.2,1.0340352058410645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,8,power_law_1.2,1.0887040138244628
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,8,power_law_1.2,1.1143168449401855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,8,power_law_1.2,1.0704895973205566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,8,power_law_1.2,1.1249664306640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,8,power_law_1.2,1.1810815811157227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,8,power_law_1.2,1.3287424087524413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,8,power_law_1.2,1.523097610473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,1,power_law_1.2,2.210406494140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,8,power_law_1.2,1.701273536682129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,8,power_law_1.2,2.298470306396484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,8,power_law_1.2,2.3846912384033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,8,power_law_1.2,3.2063488006591796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,8,power_law_1.2,3.9022590637207033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,8,power_law_1.2,5.7466880798339846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,8,power_law_1.2,7.328358459472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,1,power_law_1.2,3.286016082763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,2,4,power_law_1.2,0.025388801097869874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,2,4,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,2,4,power_law_1.2,0.029491201043128967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,2,4,power_law_1.2,0.026419198513031004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,2,4,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,2,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,2,4,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,2,4,power_law_1.2,0.03684479892253876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,2,4,power_law_1.2,0.03685120046138764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,2,4,power_law_1.2,0.03829759955406189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,2,4,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,2,4,power_law_1.2,0.04403199851512909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,2,4,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,2,4,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,2,4,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,2,4,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,2,4,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,2,4,power_law_1.2,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,2,4,power_law_1.2,0.11735039949417114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,2,4,power_law_1.2,0.2002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,2,4,power_law_1.2,0.24576001167297362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,2,4,power_law_1.2,0.32276480197906493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,2,4,power_law_1.2,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,2,4,power_law_1.2,0.6139904022216797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,8,balanced,0.040618665516376495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,8,balanced,0.039936001102129616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,8,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,8,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,8,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,8,balanced,0.041637333730856575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,8,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,8,balanced,0.04232533276081085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,8,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,8,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,8,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,8,balanced,0.05529599885145823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,8,balanced,0.07389866809050243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,8,balanced,0.07645866771539052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,8,balanced,0.08157866696516673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,8,balanced,0.13090133666992188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,8,balanced,0.16127999623616537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,8,balanced,0.2657279968261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,8,balanced,0.3283626635869344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,8,balanced,0.4949333270390828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,8,balanced,0.6502346595128378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,1,power_law_1.2,4.382720184326172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,8,balanced,0.9622186819712321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,8,balanced,1.2921173572540283
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,8,balanced,1.9887785911560059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,8,balanced,2.6820265452067056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,2,4,power_law_1.2,0.7630847930908203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,2,4,power_law_1.2,1.4585856437683105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,1,power_law_1.2,6.394879913330078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,2,4,power_law_1.2,1.8288639068603516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,8,power_law_1.2,0.03461120128631592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,8,power_law_1.2,0.03338240087032318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,8,power_law_1.2,0.03314560055732727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,8,power_law_1.2,0.034201601147651674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,8,power_law_1.2,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,8,power_law_1.2,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,8,power_law_1.2,0.037248000502586365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,8,power_law_1.2,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,8,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,8,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,8,power_law_1.2,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,8,power_law_1.2,0.04095360040664673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,8,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,8,power_law_1.2,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,8,power_law_1.2,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,8,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,8,power_law_1.2,0.051609599590301515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,8,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,8,power_law_1.2,0.07187839746475219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,8,power_law_1.2,0.0899071991443634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,8,power_law_1.2,0.17960959672927856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,8,power_law_1.2,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,8,power_law_1.2,0.4239359855651855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,8,power_law_1.2,0.851961612701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,8,power_law_1.2,1.2007424354553222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,2,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,2,power_law_1.2,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,2,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,2,power_law_1.2,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,2,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,2,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,2,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,2,power_law_1.2,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,2,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,2,power_law_1.2,0.05017600059509277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,2,power_law_1.2,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,2,power_law_1.2,0.05611519813537598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,2,power_law_1.2,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,2,power_law_1.2,0.0686079978942871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,2,power_law_1.2,0.07864320278167725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,2,power_law_1.2,0.11509759426116943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,2,power_law_1.2,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,2,power_law_1.2,0.22445440292358398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,2,power_law_1.2,0.265011191368103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,2,power_law_1.2,0.33218560218811033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,2,power_law_1.2,0.4141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,2,power_law_1.2,0.6500351905822754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,2,power_law_1.2,1.04202241897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,2,power_law_1.2,1.4493696212768554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,2,power_law_1.2,2.1364736557006836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,8,power_law_1.2,1.7326080322265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,4,power_law_1.2,0.02682879865169525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,4,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,4,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,4,power_law_1.2,0.027404800057411194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,4,power_law_1.2,0.028467199206352232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,4,power_law_1.2,0.03358719944953918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,4,power_law_1.2,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,4,power_law_1.2,0.05281280279159546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,4,power_law_1.2,0.05321599841117859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,4,power_law_1.2,0.03850240111351013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,4,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,4,power_law_1.2,0.04157440066337585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,4,power_law_1.2,0.045465600490570066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,4,power_law_1.2,0.05240960121154785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,4,power_law_1.2,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,4,power_law_1.2,0.06737279891967773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,4,power_law_1.2,0.09236479997634887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,4,power_law_1.2,0.11612160205841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,1,power_law_1.2,8.47831039428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,4,power_law_1.2,0.17305599451065062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,2,power_law_1.2,3.041881561279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,4,power_law_1.2,0.1716223955154419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,2,power_law_1.2,4.333363342285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,4,power_law_1.2,0.29367680549621583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,4,power_law_1.2,0.3768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,4,power_law_1.01,0.06062080264091492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,4,power_law_1.01,0.06652799844741822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,4,power_law_1.01,0.18778239488601683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,4,power_law_1.01,0.2504319906234741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,4,power_law_1.01,0.32419838905334475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,4,power_law_1.01,0.36515839099884034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,4,power_law_1.01,0.4454400062561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,4,power_law_1.01,0.4716159820556641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,4,power_law_1.01,0.4980735778808594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,4,power_law_1.01,0.47165441513061523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,4,power_law_1.01,0.4472832202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,4,power_law_1.01,0.5025792121887207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,4,power_law_1.01,0.48762879371643064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,4,power_law_1.01,0.4990975856781006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,4,power_law_1.2,0.7448383808135987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,4,power_law_1.01,0.5439487934112549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,4,power_law_1.01,0.5631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,8,power_law_1.2,2.4895488739013674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,4,power_law_1.01,0.5701632022857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,4,power_law_1.01,0.6660096168518066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,4,power_law_1.01,0.7266304016113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,4,power_law_1.01,0.860159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,4,power_law_1.01,1.0342399597167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,4,power_law_1.01,1.2697600364685058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,4,power_law_1.01,1.724825668334961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,4,power_law_1.01,2.3353343963623048
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,4,power_law_1.01,2.967744064331055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,4,power_law_1.01,4.199833679199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,4,power_law_1.01,5.719449615478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,4,power_law_1.01,0.5251071929931641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,4,power_law_1.01,0.7294976234436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,4,power_law_1.01,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,4,power_law_1.01,1.0371071815490722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,4,power_law_1.01,1.0360832214355469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,4,power_law_1.01,1.0590208053588868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,4,power_law_1.01,1.0690560340881348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,4,power_law_1.01,1.0784768104553222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,4,power_law_1.01,1.220800018310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,4,power_law_1.01,1.239846420288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,4,power_law_1.01,1.3889535903930663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,4,power_law_1.01,1.7940479278564454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,4,power_law_1.01,1.8409408569335937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,4,power_law_1.01,2.0842432022094726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,4,power_law_1.01,2.5657344818115235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,4,power_law_1.01,3.2063488006591796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,4,power_law_1.01,3.6325374603271485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,4,power_law_1.01,5.114675140380859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,4,power_law_1.01,6.23554573059082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,4,power_law_1.01,7.501824188232422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,4,power_law_1.2,1.0639360427856446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,4,power_law_1.01,9.812992095947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,4,power_law_1.01,11.513651275634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,4,power_law_1.01,14.718156433105468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,4,power_law_1.2,1.3006848335266112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,4,power_law_1.2,0.0579584002494812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,4,power_law_1.2,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,4,power_law_1.2,0.3141632080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,4,power_law_1.2,0.4591616153717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,4,power_law_1.2,0.5996543884277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,4,power_law_1.2,0.7559167861938476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,4,power_law_1.2,1.0053631782531738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,4,power_law_1.2,0.8652799606323243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,4,power_law_1.2,0.9002943992614746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,4,power_law_1.2,0.8910847663879394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,4,power_law_1.2,0.8243200302124023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,4,power_law_1.2,0.9275391578674317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,4,power_law_1.2,0.941260814666748
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,4,power_law_1.2,0.9766912460327148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,4,power_law_1.2,1.0239999771118165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,4,power_law_1.2,1.0518527984619142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,4,power_law_1.2,1.0917887687683105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,4,power_law_1.2,1.176371192932129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,4,power_law_1.2,1.2621824264526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,4,power_law_1.2,1.4079999923706055
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,4,power_law_1.2,1.5269887924194336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,4,power_law_1.2,1.9308544158935548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,4,power_law_1.2,2.324070358276367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,4,power_law_1.2,2.9585407257080076
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,4,power_law_1.2,3.9530494689941404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,4,power_law_1.2,5.2111358642578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,4,power_law_1.2,6.678118133544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,4,power_law_1.01,21.194137573242188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,4,power_law_1.01,23.845683288574218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,8,balanced,0.04625066618124644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,8,balanced,0.045226668318112694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,8,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,8,balanced,0.07338666419188182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,8,balanced,0.30907734235127765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,8,balanced,0.3816106716791789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,8,balanced,0.3845119873682658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,8,balanced,0.3872426748275757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,8,balanced,0.3882666826248169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,8,balanced,0.38980265458424884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,8,balanced,0.3938986857732137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,8,balanced,0.3964586655298869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,8,balanced,0.3993599812189738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,8,balanced,0.40482131640116376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,8,balanced,0.41198933124542236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,8,balanced,0.420693318049113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,8,balanced,0.4331520001093547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,8,balanced,0.4500480095545451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,8,balanced,0.47035733858744305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,8,balanced,0.5130240122477213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,8,balanced,0.5403306484222412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,8,balanced,0.672597328821818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,8,balanced,0.8065706888834635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,8,balanced,1.170090675354004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,8,balanced,1.480533281962077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,8,balanced,2.094933350880941
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,8,balanced,2.70796807607015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,4,power_law_1.2,1.7383039474487305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,4,power_law_1.01,30.515200805664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,16,balanced,0.04607999821503957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,16,balanced,0.04897066454092661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,16,balanced,0.055125330885251365
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,16,balanced,0.31948800881703693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,16,balanced,0.4787199894587199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,16,balanced,0.5582506656646729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,16,balanced,0.560640017191569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,16,balanced,0.5589173237482706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,16,balanced,0.5613226493199667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,16,balanced,0.5635413328806559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,16,balanced,0.5657600164413452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,16,balanced,0.571733315785726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,16,balanced,0.5741226673126221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,16,balanced,0.5797546704610189
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,16,balanced,0.5886293252309164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,16,balanced,0.5939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,16,balanced,0.6055253346761068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,16,balanced,0.6150826613108317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,16,balanced,0.6381226778030396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,16,balanced,0.6952959696451823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,16,balanced,0.7458133697509766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,16,balanced,0.8581120173136393
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,16,balanced,0.9644373257954916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,16,balanced,1.3213013013203938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,16,balanced,1.6561493873596191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,16,balanced,2.187605381011963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,16,balanced,2.7453438440958657
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,4,power_law_1.01,35.708108520507814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,4,power_law_1.2,1.6236543655395508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,4,power_law_1.2,2.0930559158325197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,4,power_law_1.2,2.9509632110595705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,4,power_law_1.2,3.5690494537353517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,4,power_law_1.2,4.953907012939453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,4,power_law_1.2,7.382630157470703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,4,power_law_1.2,6.783795166015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,4,power_law_1.2,6.85322265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,4,power_law_1.2,6.827008056640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,4,power_law_1.2,7.142809295654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,4,power_law_1.2,7.200358581542969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,4,power_law_1.2,7.52332763671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,4,power_law_1.2,8.009318542480468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,4,power_law_1.2,8.14940185546875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,32,4,power_law_1.2,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,32,4,power_law_1.2,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,32,4,power_law_1.2,0.06041600108146668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,32,4,power_law_1.2,0.0673792004585266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,32,4,power_law_1.2,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,4,power_law_1.2,8.270438385009765
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,32,4,power_law_1.2,0.10629119873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,32,4,power_law_1.2,0.10362880229949951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,32,4,power_law_1.2,0.15994880199432374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,32,4,power_law_1.2,0.1644544005393982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,32,4,power_law_1.2,0.16752640008926392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,32,4,power_law_1.2,0.1978368043899536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,32,4,power_law_1.2,0.20848000049591064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,32,4,power_law_1.2,0.19251199960708618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,32,4,power_law_1.2,0.23101439476013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,4,power_law_1.2,8.577638244628906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,32,4,power_law_1.2,0.2461695909500122
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,32,4,power_law_1.2,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,32,4,power_law_1.2,0.2668544054031372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,32,4,power_law_1.2,0.3258368015289307
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,32,4,power_law_1.2,0.374783992767334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,32,4,power_law_1.2,0.4892672061920166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,32,4,power_law_1.2,0.638976001739502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,4,power_law_1.2,8.757862091064453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,32,4,power_law_1.2,0.9746432304382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,32,4,power_law_1.2,1.3469568252563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,4,power_law_1.2,8.767897796630859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,32,4,power_law_1.2,1.9052543640136719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,4,power_law_1.2,9.223577880859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,32,4,power_law_1.2,2.85982723236084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,4,power_law_1.2,9.543885040283204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,32,4,power_law_1.2,3.6640766143798826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,4,power_law_1.2,10.66455078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,4,power_law_1.2,12.686131286621094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,32,4,power_law_1.2,5.190041732788086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,4,power_law_1.2,12.853861999511718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,4,power_law_1.2,16.07208251953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,8,32,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,8,32,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,8,32,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,8,32,power_law_1.01,0.05713919997215271
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,8,32,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,8,32,power_law_1.01,0.05875200033187866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,4,power_law_1.2,19.67595520019531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,8,32,power_law_1.01,0.05854719877243042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,8,32,power_law_1.01,0.05734400153160095
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,8,32,power_law_1.01,0.05775359869003296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,8,32,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,8,32,power_law_1.01,0.060211199522018435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,8,32,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,8,32,power_law_1.01,0.06594560146331788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,8,32,power_law_1.01,0.06881279945373535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,8,32,power_law_1.01,0.07618560194969178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,8,32,power_law_1.01,0.08232960104942322
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,8,32,power_law_1.01,0.10280959606170655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,8,32,power_law_1.01,0.1439743995666504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,8,32,power_law_1.01,0.1921023964881897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,8,32,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,8,32,power_law_1.01,0.29900801181793213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,8,32,power_law_1.01,0.37765119075775144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,8,32,power_law_1.01,0.5187583923339844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,8,32,power_law_1.01,0.7659520149230957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,4,power_law_1.2,26.61109619140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,8,32,power_law_1.01,1.0285056114196778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,8,32,power_law_1.01,1.6545600891113281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,8,32,power_law_1.01,2.242355155944824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,4,power_law_1.2,29.642547607421875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.06553599834442139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.07393280267715455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.2811903953552246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.4720640182495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.718233585357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.9771007537841797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,1,power_law_1.2,1.4616576194763184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,1,power_law_1.2,1.5378432273864746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,1,power_law_1.2,1.5939583778381348
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,1,power_law_1.2,1.6580608367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,1,power_law_1.2,1.739776039123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,1,power_law_1.2,1.827225685119629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,1,power_law_1.2,1.8503679275512694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,1,power_law_1.2,1.9939327239990234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,1,power_law_1.2,2.062335968017578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,1,power_law_1.2,2.1903360366821287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,1,power_law_1.2,2.311167907714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,1,power_law_1.2,2.5159679412841798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,1,power_law_1.2,2.777292823791504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,1,power_law_1.2,3.2051071166992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,1,power_law_1.2,3.661004638671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,1,power_law_1.2,4.571136093139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,1,power_law_1.2,5.47061767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,1,power_law_1.2,7.403308868408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,1,power_law_1.2,9.240985870361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,1,power_law_1.2,13.110887145996093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,1,power_law_1.2,17.080320739746092
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,16,power_law_1.01,0.6039552211761474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,16,power_law_1.01,1.0338303565979003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,16,power_law_1.01,1.5216640472412108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,16,power_law_1.01,1.398374366760254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,16,power_law_1.01,1.5187968254089355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,16,power_law_1.01,1.3883392333984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,16,power_law_1.01,1.3821951866149902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,16,power_law_1.01,1.4827520370483398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,16,power_law_1.01,1.2206080436706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,16,power_law_1.01,1.2210176467895508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,16,power_law_1.01,1.1665408134460449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,16,power_law_1.01,1.415167999267578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,16,power_law_1.01,1.470259189605713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,16,power_law_1.01,1.4206975936889648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,16,power_law_1.01,1.2697600364685058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,16,power_law_1.01,1.3965312004089356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,16,power_law_1.01,1.3385727882385254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,16,power_law_1.01,1.509990406036377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,16,power_law_1.01,1.553600025177002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,16,power_law_1.01,1.619558334350586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,16,power_law_1.01,1.7031167984008788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,16,power_law_1.01,2.045542335510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,16,power_law_1.01,2.290073585510254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,16,power_law_1.01,2.8872703552246093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,16,power_law_1.01,3.5883007049560547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,16,power_law_1.01,4.908236694335938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,16,power_law_1.01,5.902118301391601
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,16,power_law_1.01,0.6021120071411132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,16,power_law_1.01,1.0561535835266114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,16,power_law_1.01,1.559347152709961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,16,power_law_1.01,1.5120384216308593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,16,power_law_1.01,1.5568896293640138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,16,power_law_1.01,1.5589376449584962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,16,power_law_1.01,1.2867584228515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,16,power_law_1.01,1.3461440086364747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,16,power_law_1.01,1.3737728118896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,16,power_law_1.01,1.4812992095947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,16,power_law_1.01,1.3756416320800782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,16,power_law_1.01,1.346726417541504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,16,power_law_1.01,1.3291520118713378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,16,power_law_1.01,1.2613632202148437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,16,power_law_1.01,1.515110397338867
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,16,power_law_1.01,1.4055423736572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,16,power_law_1.01,1.438105583190918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,16,power_law_1.01,1.581670379638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,16,power_law_1.01,1.5898624420166017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,16,power_law_1.01,1.7367040634155273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,16,power_law_1.01,1.9744768142700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,16,power_law_1.01,2.0332544326782225
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,16,power_law_1.01,2.3949312210083007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,16,power_law_1.01,3.1743999481201173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,16,power_law_1.01,3.567820739746094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,16,power_law_1.01,5.076377487182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,16,power_law_1.01,5.948211288452148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,2,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,2,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,2,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,2,balanced,0.23176532983779907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,2,balanced,0.44697598616282147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,2,balanced,0.44918398062388104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,2,balanced,0.45124268531799316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,2,balanced,0.4534613291422526
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,2,balanced,0.45532798767089844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,2,balanced,0.4560106595357259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,2,balanced,0.460970679918925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,2,balanced,0.463701327641805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,2,balanced,0.4664320151011149
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,2,balanced,0.47377065817515057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,2,balanced,0.4910080035527547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,2,balanced,0.49646933873494464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,2,balanced,0.5084160168965658
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,2,balanced,0.5096000035603842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,2,balanced,0.539136012395223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,2,balanced,0.5964800119400024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,2,balanced,0.6456319888432821
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,2,balanced,0.7726079622904459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,2,balanced,0.92194135983785
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,2,balanced,1.2344319820404053
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,2,balanced,1.5627840360005696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,2,balanced,2.351616064707438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,2,balanced,3.137872060139974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,1,balanced,0.07611733178297679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,1,balanced,0.2879146734873454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,1,balanced,0.5348693529764811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,1,balanced,1.025877316792806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,1,balanced,2.043546676635742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,1,balanced,3.957248051961263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,1,balanced,5.908821105957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,1,balanced,5.928618748982747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,1,balanced,5.94432004292806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,1,balanced,5.966165542602539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,1,balanced,5.9999574025472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,1,balanced,6.030143737792969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,1,balanced,6.0625654856363935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,1,balanced,6.119082768758138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,1,balanced,6.173525492350261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,1,balanced,6.226773579915364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,1,balanced,6.326954523722331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,1,balanced,6.518613179524739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,1,balanced,6.70907719930013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,1,balanced,7.085397084554036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,1,balanced,7.459653218587239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,1,balanced,8.230570475260416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,1,balanced,8.801109313964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,1,balanced,10.81069310506185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,1,balanced,11.964234670003256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,16,16,balanced,0.04778666794300079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,16,16,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,16,16,balanced,0.04898133377234141
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,16,16,balanced,0.05120000243186951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,16,16,balanced,0.05495466788609823
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,1,balanced,15.006549835205078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,16,16,balanced,0.06380266447861989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,16,16,balanced,0.21640533208847046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,16,16,balanced,0.21708800395329794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,16,16,balanced,0.21947733561197916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,16,16,balanced,0.2187946637471517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,16,16,balanced,0.22064000368118286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,16,16,balanced,0.2244266668955485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,16,16,balanced,0.22459733486175537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,16,16,balanced,0.22869332631429037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,16,16,balanced,0.23517866929372153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,16,16,balanced,0.23806933561960855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,16,16,balanced,0.24644267559051514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,16,16,balanced,0.26077866554260254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,16,16,balanced,0.27986133098602295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,16,16,balanced,0.3083946704864502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,16,16,balanced,0.3457706769307454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,16,16,balanced,0.3993599812189738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,16,16,balanced,0.5031253496805826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,1,balanced,18.664447784423828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,16,16,balanced,0.7410346666971842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,16,16,balanced,0.9120426972707113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,16,16,balanced,1.4027093251546223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,16,16,balanced,1.8602453867594402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,32,2,balanced,0.030693332354227703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,32,2,balanced,0.03054400036732356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,32,2,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,32,2,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,32,2,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,32,2,balanced,0.03276266654332479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,32,2,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,32,2,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,32,2,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,32,2,balanced,0.03429333368937174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,32,2,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,32,2,balanced,0.03754666695992152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,32,2,balanced,0.038202665746212006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,32,2,balanced,0.039594667653242745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,32,2,balanced,0.05273599922657013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,32,2,balanced,0.05509866774082184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,32,2,balanced,0.06263466676076253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,32,2,balanced,0.07850666840871175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,32,2,balanced,0.09557333588600159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,32,2,balanced,0.18653867642084757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,32,2,balanced,0.25514666239420575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,32,2,balanced,0.37887998421986896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,32,2,balanced,0.5026079813639323
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,32,2,balanced,0.8038400014241537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,32,2,balanced,1.112063964207967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,32,2,balanced,1.7298773129781086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,32,2,balanced,2.35263458887736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,32,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,32,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,32,balanced,0.034815999368826546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,32,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,32,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,32,balanced,0.040448000033696495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,32,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,32,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,32,balanced,0.041984001795450844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,32,balanced,0.04215466479460398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,32,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,32,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,32,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,32,balanced,0.045567999283472695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,32,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,32,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,32,balanced,0.051882664362589516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,32,balanced,0.05750399827957153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,32,balanced,0.06502399841944377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,32,balanced,0.07833600044250488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,32,balanced,0.09591466188430786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,32,balanced,0.2146986722946167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,32,balanced,0.26845866441726685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,32,balanced,0.35089067618052167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,32,balanced,0.457045316696167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,32,balanced,0.6145706574122111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,32,balanced,0.8147626717885336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,32,balanced,0.04949333270390829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,32,balanced,0.04983466863632202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,32,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,32,balanced,0.0506879985332489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,32,balanced,0.05478399991989136
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,32,balanced,0.2996906638145447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,32,balanced,0.43195732434590656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,32,balanced,0.4346880118052165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,32,balanced,0.4363946517308553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,32,balanced,0.4375893274943034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,32,balanced,0.4408320188522339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,32,balanced,0.44509867827097577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,32,balanced,0.44731732209523517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,32,balanced,0.45533867677052814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,2,16,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,32,balanced,0.4633599917093913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,2,16,balanced,0.04642133414745331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,32,balanced,0.4720640182495117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,2,16,balanced,0.06638933221499126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,32,balanced,0.4833279848098755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,2,16,balanced,0.32460800806681317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,2,16,balanced,0.4968106746673584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,32,balanced,0.5067093372344971
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,2,16,balanced,0.5568853219350179
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,32,balanced,0.5340160131454468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,2,16,balanced,0.559440016746521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,32,balanced,0.5857280095418295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,2,16,balanced,0.5520960092544556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,2,16,balanced,0.5534720023473104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,32,balanced,0.6314666668574015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,2,16,balanced,0.5558613141377767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,2,16,balanced,0.5582506656646729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,32,balanced,0.7091200351715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,2,16,balanced,0.5635413328806559
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,2,16,balanced,0.5659306844075521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,32,balanced,0.8106666405995687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,2,16,balanced,0.5719039837519327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,2,16,balanced,0.5819733142852783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,32,balanced,1.0141013463338215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,2,16,balanced,0.5870933135350546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,2,16,balanced,0.6002346674601237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,2,16,balanced,0.6285653511683146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,32,balanced,1.2625919977823894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,2,16,balanced,0.6579200029373169
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,2,16,balanced,0.7087786992390951
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,32,balanced,1.7088853518168132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,2,16,balanced,0.7611626784006754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,2,16,balanced,0.8767146269480387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,32,balanced,2.2524587313334146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,2,16,balanced,1.0036906401316326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,2,16,balanced,1.3056000073750813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,2,16,balanced,1.577130635579427
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,2,16,balanced,2.2029546101888022
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,2,16,balanced,2.8129278818766275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,16,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,16,power_law_1.2,0.05140479803085327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,16,power_law_1.2,0.04710400104522705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,16,power_law_1.2,0.047891199588775635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,16,power_law_1.2,0.048332801461219786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,16,power_law_1.2,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,16,power_law_1.2,0.042393600940704344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,16,power_law_1.2,0.0419840008020401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,16,power_law_1.2,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,16,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,16,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,16,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,16,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,16,power_law_1.2,0.04891520142555237
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,16,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,16,power_law_1.2,0.05570560097694397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,16,power_law_1.2,0.0657151997089386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,16,power_law_1.2,0.0759552001953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,16,power_law_1.2,0.09379839897155762
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,16,power_law_1.2,0.11653120517730713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,16,power_law_1.2,0.17448960542678832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,16,power_law_1.2,0.30883839130401614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,16,power_law_1.2,0.34652159214019773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,16,power_law_1.2,0.5081088066101074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,16,power_law_1.2,0.6821887969970704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,16,power_law_1.2,1.1565055847167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,16,power_law_1.2,1.5951871871948242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,16,16,power_law_1.01,0.039526399970054624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,16,16,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,16,16,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,16,16,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,16,16,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,16,16,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,16,16,power_law_1.01,0.040755200386047366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,16,16,power_law_1.01,0.04177919924259186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,16,16,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,16,16,power_law_1.01,0.04259839951992035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,16,16,power_law_1.01,0.04321280121803284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,16,16,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,16,16,power_law_1.01,0.04524160027503967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,16,16,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,16,16,power_law_1.01,0.05079039931297302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,16,16,power_law_1.01,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,16,16,power_law_1.01,0.05631999969482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,16,16,power_law_1.01,0.06471040248870849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,16,16,power_law_1.01,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,16,16,power_law_1.01,0.08765439987182617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,16,16,power_law_1.01,0.10915839672088623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,16,16,power_law_1.01,0.15441919565200807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,16,16,power_law_1.01,0.20930559635162355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,16,16,power_law_1.01,0.3649535894393921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,16,16,power_law_1.01,0.5089280128479003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,16,16,power_law_1.01,0.8005632400512696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,16,16,power_law_1.01,1.2597248077392578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,2,2,power_law_1.2,0.032153600454330446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,2,2,power_law_1.2,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,2,2,power_law_1.2,0.22729599475860596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,2,2,power_law_1.2,0.368831992149353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,2,2,power_law_1.2,0.4583424091339111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,2,2,power_law_1.2,0.7251711845397949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,2,2,power_law_1.2,0.77226881980896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,2,2,power_law_1.2,0.8566783905029297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,2,2,power_law_1.2,0.8863743782043457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,2,2,power_law_1.2,0.8439807891845703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,2,2,power_law_1.2,0.8878080368041992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,2,2,power_law_1.2,0.8986623764038086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,2,2,power_law_1.2,0.9092927932739258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,2,2,power_law_1.2,0.9277440071105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,2,2,power_law_1.2,0.9623552322387695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,2,2,power_law_1.2,0.9879551887512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,2,2,power_law_1.2,0.9822208404541015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,2,2,power_law_1.2,1.0577919960021973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,2,2,power_law_1.2,1.113088035583496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,2,2,power_law_1.2,1.2328767776489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,2,2,power_law_1.2,1.3576191902160644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,2,2,power_law_1.2,1.683456039428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,2,2,power_law_1.2,1.824563217163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,2,2,power_law_1.2,2.4078336715698243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,2,2,power_law_1.2,2.808831977844238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,2,2,power_law_1.2,3.927449417114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,2,2,power_law_1.2,4.704460906982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,1,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,1,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,1,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,1,balanced,0.049322664737701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,1,balanced,0.23910399278004965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,1,balanced,0.25224532683690387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,1,balanced,0.25702399015426636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,1,balanced,0.26129066944122314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,1,balanced,0.26708799600601196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,1,balanced,0.26948267221450806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,1,balanced,0.2781706651051839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,1,balanced,0.28757333755493164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,1,balanced,0.2959360082944234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,1,balanced,0.30958932638168335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,1,balanced,0.32546132802963257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,1,balanced,0.343722661336263
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,1,balanced,0.35447466373443604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,1,balanced,0.4072106679280599
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,1,balanced,0.4780319929122925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,1,balanced,0.6536533435185751
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,1,balanced,0.8668159643809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,1,balanced,1.32369065284729
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,1,balanced,1.706666628519694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,1,balanced,2.4722773234049478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,1,balanced,3.2822612126668296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,1,balanced,5.017258644104004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,1,balanced,6.732800165812175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,1,balanced,0.0452106644709905
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,1,balanced,0.048810665806134544
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,1,balanced,0.14335999886194864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,1,balanced,0.34986666838328045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,1,balanced,0.6685012976328532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,1,balanced,1.3056000073750813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,1,balanced,1.3115733464558919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,1,balanced,1.3201066652933757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,1,balanced,1.3271040121714275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,1,balanced,1.3329066435496013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,1,balanced,1.3424639701843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,1,balanced,1.3533546129862468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,1,balanced,1.3624320030212402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,1,balanced,1.3827412923177083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,1,balanced,1.4085119565327961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,1,balanced,1.4288214047749836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,1,balanced,1.467898686726888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,1,balanced,1.6049493153889973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,1,balanced,1.7044480641682942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,1,balanced,1.8462613423665364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,1,balanced,2.004138628641764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,1,balanced,2.345813274383545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,16,power_law_1.01,0.3229696035385132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,16,power_law_1.01,0.5427199840545655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,1,balanced,2.7127466201782227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,16,power_law_1.01,0.787660789489746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,1,balanced,3.547306696573893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,16,power_law_1.01,0.7827455997467041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,16,power_law_1.01,0.8024064064025879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,1,balanced,4.407295862833659
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,16,power_law_1.01,0.8032256126403808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,16,power_law_1.01,0.6688767910003662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,16,power_law_1.01,0.7139328002929688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,1,balanced,6.130346934000651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,16,power_law_1.01,0.6699007987976074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,16,power_law_1.01,0.6899712085723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,16,power_law_1.01,0.7352320194244385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,1,balanced,7.862101236979167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,16,power_law_1.01,0.6692863941192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,16,power_law_1.01,0.7323647975921631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,16,power_law_1.01,0.6887423992156982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,16,power_law_1.01,0.7186431884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,16,power_law_1.01,0.8290304183959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,16,power_law_1.01,0.7548927783966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,16,power_law_1.01,0.8212479591369629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,16,power_law_1.01,0.7919616222381591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,16,power_law_1.01,0.9463808059692382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,16,power_law_1.01,0.9469951629638672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,16,power_law_1.01,1.1644927978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,16,power_law_1.01,1.3000703811645509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,16,power_law_1.01,1.7553407669067382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,16,power_law_1.01,2.286387252807617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,16,power_law_1.01,3.1436800003051757
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,16,power_law_1.01,4.0239105224609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,32,power_law_1.2,0.21073920726776124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,32,power_law_1.2,0.19107840061187745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,32,power_law_1.2,0.19271680116653442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,32,power_law_1.2,0.19394559860229493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,32,power_law_1.2,0.10711040496826171
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,32,power_law_1.2,0.05221760272979736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,32,power_law_1.2,0.17367039918899535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,32,power_law_1.2,0.07229440212249756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,32,power_law_1.2,0.15421439409255983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,32,power_law_1.2,0.09564160108566284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,32,power_law_1.2,0.13844480514526367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,32,power_law_1.2,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,32,power_law_1.2,0.15278079509735107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,32,power_law_1.2,0.12472319602966309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,32,power_law_1.2,0.16138240098953247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,32,power_law_1.2,0.19230719804763793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,32,power_law_1.2,0.208076810836792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,32,power_law_1.2,0.22300798892974855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,32,power_law_1.2,0.22773759365081786
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,32,power_law_1.2,0.2711551904678345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,32,power_law_1.2,0.3028991937637329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,32,power_law_1.2,0.3936255931854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,32,power_law_1.2,0.5195775985717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,32,power_law_1.2,0.7471104145050049
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,32,power_law_1.2,0.9795583724975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,32,power_law_1.2,1.6351232528686523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,32,power_law_1.2,2.2439807891845702
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,4,power_law_1.01,0.4399104118347168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,4,power_law_1.01,0.753868818283081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,4,power_law_1.01,0.7809023857116699
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,4,power_law_1.01,1.0248191833496094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,4,power_law_1.01,1.315839958190918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,4,power_law_1.01,1.7342464447021484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,4,power_law_1.01,1.8132991790771484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,4,power_law_1.01,1.8546688079833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,4,power_law_1.01,1.9398656845092774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,4,power_law_1.01,1.9042303085327148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,4,power_law_1.01,1.8808832168579102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,4,power_law_1.01,1.9378175735473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,4,power_law_1.01,1.9361791610717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,4,power_law_1.01,2.0215808868408205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,4,power_law_1.01,2.0424575805664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,4,power_law_1.01,2.110259246826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,4,power_law_1.01,2.2054912567138674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,4,power_law_1.01,2.2786048889160155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,4,power_law_1.01,2.4422399520874025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,4,power_law_1.01,2.671206474304199
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,4,power_law_1.01,2.9511680603027344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,4,power_law_1.01,3.5913726806640627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,4,power_law_1.01,3.989913558959961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,4,power_law_1.01,5.040947341918946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,4,power_law_1.01,6.327910232543945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,4,power_law_1.01,8.288460540771485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,4,power_law_1.01,11.328717041015626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,32,2,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,32,2,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,32,2,power_law_1.2,0.028262400627136232
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,32,2,power_law_1.2,0.02908160090446472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,32,2,power_law_1.2,0.029900801181793214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,32,2,power_law_1.2,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,32,2,power_law_1.2,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,32,2,power_law_1.2,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,32,2,power_law_1.2,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,32,2,power_law_1.2,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,32,2,power_law_1.2,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,32,2,power_law_1.2,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,32,2,power_law_1.2,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,32,2,power_law_1.2,0.05877760052680969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,32,2,power_law_1.2,0.06103039979934692
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,32,2,power_law_1.2,0.07147520184516906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,32,2,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,8,power_law_1.01,0.048742398619651794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,8,power_law_1.01,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,32,2,power_law_1.2,0.1124351978302002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,8,power_law_1.01,0.04997119903564453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,8,power_law_1.01,0.06123520135879516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,8,power_law_1.01,0.08929280042648316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,32,2,power_law_1.2,0.12001279592514039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,8,power_law_1.01,0.10629119873046874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,8,power_law_1.01,0.12471679449081421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,8,power_law_1.01,0.19804160594940184
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,8,power_law_1.01,0.16650240421295165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,8,power_law_1.01,0.19865599870681763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,8,power_law_1.01,0.1779711961746216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,8,power_law_1.01,0.19988479614257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,8,power_law_1.01,0.21135358810424804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,8,power_law_1.01,0.22402560710906982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,8,power_law_1.01,0.22690560817718505
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,8,power_law_1.01,0.24248321056365968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,8,power_law_1.01,0.2598912000656128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,8,power_law_1.01,0.28015360832214353
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,8,power_law_1.01,0.32746880054473876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,8,power_law_1.01,0.3717119932174683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,8,power_law_1.01,0.44748802185058595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,8,power_law_1.01,0.591641616821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,32,2,power_law_1.2,0.18247679471969605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,8,power_law_1.01,0.8151040077209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,8,power_law_1.01,1.0768383979797362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,8,power_law_1.01,1.5513600349426269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,32,2,power_law_1.2,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,8,power_law_1.01,2.366464042663574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,8,power_law_1.01,3.2706558227539064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,32,2,power_law_1.2,0.3821568012237549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.056729602813720706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.0681984007358551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.2428607940673828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.2406399965286255
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.24842240810394287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.2490367889404297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.24842240810394287
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.2553855895996094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.2531327962875366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.264192008972168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.2682687997817993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,32,2,power_law_1.2,0.5304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.2785279989242554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.2865151882171631
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.3072000026702881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.38727679252624514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.4325376033782959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,4,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,4,balanced,0.022858666876951855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,4,balanced,0.023210667073726654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,4,balanced,0.02454400062561035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,4,balanced,0.027477333943049114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,4,balanced,0.0288426677385966
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,4,balanced,0.0290133332212766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,4,balanced,0.029498666524887085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,4,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,4,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,4,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,4,balanced,0.03566399961709976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,4,balanced,0.0363520011305809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,4,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,4,balanced,0.04915200173854828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,4,balanced,0.05222400029500326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,4,balanced,0.07543466488520305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,4,balanced,0.08533333738644917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,4,balanced,0.17203199863433838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,4,balanced,0.24710400899251303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,4,balanced,0.34013867378234863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.49848318099975586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,4,balanced,0.4416853189468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,4,balanced,0.7195306619008383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,4,balanced,1.0738346576690674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.6791168212890625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,32,1,power_law_1.2,1.027449607849121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,32,2,power_law_1.2,0.8839167594909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,4,1,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,4,1,balanced,0.03566933423280716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,4,1,balanced,0.15598932902018228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,4,1,balanced,0.3657386700312297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,4,1,balanced,0.6981973648071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,4,1,balanced,0.9444693724314371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,4,1,balanced,0.9519786834716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,4,1,balanced,0.9545386632283529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,4,1,balanced,0.9615360101064047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,4,1,balanced,0.9644373257954916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,4,1,balanced,0.9743359883626302
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,4,1,balanced,0.9837226867675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,4,1,balanced,0.9891839822133383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,32,1,power_law_1.2,1.3922304153442382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,4,1,balanced,1.0031786759694417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,4,1,balanced,1.018181324005127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,4,1,balanced,1.0313386917114258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,4,1,balanced,1.0574506918589275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,4,1,balanced,1.0989226500193279
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,4,1,balanced,1.156768004099528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,4,1,balanced,1.248255968093872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,4,1,balanced,1.3743786811828613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,4,1,balanced,1.6317440668741863
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,4,1,balanced,1.875285307566325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,4,1,balanced,2.4026452700297036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,4,1,balanced,2.962090810139974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,14336,2,8,1,2,balanced,0.3051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,14336,2,8,1,2,balanced,0.5474986632664999
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,4,1,balanced,4.302506764729817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,14336,2,8,1,2,balanced,1.0345813433329265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,14336,2,8,1,2,balanced,1.035264015197754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,14336,2,8,1,2,balanced,1.0315093199412029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,14336,2,8,1,2,balanced,1.040554682413737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,14336,2,8,1,2,balanced,1.047210693359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,14336,2,8,1,2,balanced,1.053866704305013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,4,1,balanced,5.317290623982747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,14336,2,8,1,2,balanced,1.0600106716156006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,14336,2,8,1,2,balanced,1.0659840106964111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,14336,2,8,1,2,balanced,1.0794666608174641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,14336,2,8,1,2,balanced,1.0992639859517415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,14336,2,8,1,2,balanced,1.1122346719106038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,14336,2,8,1,2,balanced,1.1571199893951416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,14336,2,8,1,2,balanced,1.18340269724528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,14336,2,8,1,2,balanced,1.2006399631500244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,14336,2,8,1,2,balanced,1.2352533340454102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,14336,2,8,1,2,balanced,1.7527467409769695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,14336,2,8,1,2,balanced,1.8749225934346516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,14336,2,8,1,2,balanced,2.420053323109945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,14336,2,8,1,2,balanced,2.882218678792318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,14336,2,8,1,2,balanced,3.8275413513183594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,32,2,power_law_1.2,1.0594304084777832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,14336,2,8,1,2,balanced,4.837546666463216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,14336,2,8,1,2,balanced,6.7642027537028
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,14336,2,8,1,2,balanced,8.693402608235678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,14336,2,8,1,2,balanced,12.644351959228516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,14336,2,8,1,2,balanced,17.629866282145183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,32,1,power_law_1.2,2.0955135345458986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,32,1,power_law_1.2,2.775839996337891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,32,1,power_law_1.2,4.138393783569336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,32,2,power_law_1.2,1.78155517578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,1,4,power_law_1.01,0.5300288200378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,1,4,power_law_1.01,0.6330368041992187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,1,4,power_law_1.01,0.6383615970611572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,1,4,power_law_1.01,0.9410559654235839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,1,4,power_law_1.01,0.8988672256469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,1,4,power_law_1.01,0.9054207801818848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,1,4,power_law_1.01,0.9158656120300293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,1,4,power_law_1.01,0.9187328338623046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,1,4,power_law_1.01,1.1386879920959472
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,1,4,power_law_1.01,1.1472895622253418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,1,4,power_law_1.01,1.1517951965332032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,1,4,power_law_1.01,1.4118911743164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,1,4,power_law_1.01,1.5988608360290528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,1,4,power_law_1.01,1.547878360748291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,1,4,power_law_1.01,1.6955392837524415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,1,4,power_law_1.01,1.8819072723388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,1,4,power_law_1.01,2.2224895477294924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,1,4,power_law_1.01,3.0064640045166016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,1,4,power_law_1.01,3.468697738647461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,1,4,power_law_1.01,5.256601715087891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,1,4,power_law_1.01,6.533939361572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,32,2,power_law_1.2,2.9517824172973635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,32,1,power_law_1.2,5.579366302490234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,1,4,power_law_1.01,7.74676513671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,1,4,power_law_1.01,10.784563446044922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,16,power_law_1.2,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,16,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,16,power_law_1.2,0.03049600124359131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,16,power_law_1.2,0.03091840147972107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,16,power_law_1.2,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,16,power_law_1.2,0.032358399033546446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,16,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,16,power_law_1.2,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,16,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,16,power_law_1.2,0.041356799006462094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,16,power_law_1.2,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,16,power_law_1.2,0.04423680007457733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,16,power_law_1.2,0.06225919723510742
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,16,power_law_1.2,0.06778879761695862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,16,power_law_1.2,0.06799359917640686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,16,power_law_1.2,0.05692800283432007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,16,power_law_1.2,0.07004160284996033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,16,power_law_1.2,0.08785920143127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,16,power_law_1.2,0.1218559980392456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,16,power_law_1.2,0.16895999908447265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,16,power_law_1.2,0.32829439640045166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,16,power_law_1.2,0.3348479986190796
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,16,power_law_1.2,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,1,4,power_law_1.01,13.178675842285156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,16,power_law_1.2,0.8591360092163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,1,4,power_law_1.01,16.386866760253906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,4,power_law_1.01,0.2139967918395996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,4,power_law_1.01,0.35614719390869143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,4,power_law_1.01,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,4,power_law_1.01,0.5633920192718506
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,4,power_law_1.01,0.7862271785736084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,4,power_law_1.01,0.7546879768371582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,4,power_law_1.01,1.0346495628356933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,4,power_law_1.01,1.1124735832214356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,4,power_law_1.01,1.1094016075134276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,4,power_law_1.01,1.0457088470458984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,4,power_law_1.01,1.2179455757141113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,4,power_law_1.01,1.1841535568237305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,4,power_law_1.01,1.1275967597961425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,4,power_law_1.01,1.1507712364196778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,4,power_law_1.01,1.2361727714538575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,4,power_law_1.01,1.2592896461486816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,4,power_law_1.01,1.2820480346679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,4,power_law_1.01,1.397555160522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,4,power_law_1.01,1.3361151695251465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,4,power_law_1.01,1.4946304321289063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,4,power_law_1.01,1.5755135536193847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,4,power_law_1.01,1.7518400192260741
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,4,power_law_1.01,2.026291275024414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,16,power_law_1.2,1.5321087837219238
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,4,power_law_1.01,2.5769983291625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,4,power_law_1.01,3.2149505615234375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,4,power_law_1.01,4.631961441040039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,4,power_law_1.01,5.373132705688477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,1,4,power_law_1.01,22.91978302001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,1,32,power_law_1.2,0.7503871917724609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,1,32,power_law_1.2,0.7249919891357421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,1,32,power_law_1.2,0.7264256000518798
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,1,32,power_law_1.2,0.5087232112884521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,1,32,power_law_1.2,0.5160960197448731
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,1,32,power_law_1.2,0.677888011932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,1,32,power_law_1.2,0.6805503845214844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,1,32,power_law_1.2,0.7081984043121338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,1,32,power_law_1.2,0.7364480018615722
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,1,32,power_law_1.2,0.7131135940551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,1,32,power_law_1.2,0.7257791996002197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,1,32,power_law_1.2,0.7372799873352051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,1,32,power_law_1.2,0.745472002029419
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,1,32,power_law_1.2,0.809779167175293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,1,32,power_law_1.2,0.9119744300842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,1,32,power_law_1.2,0.8771583557128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,1,32,power_law_1.2,0.9373696327209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,1,32,power_law_1.2,1.0975232124328613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,1,32,power_law_1.2,1.16244478225708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,1,32,power_law_1.2,1.3496319770812988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,1,32,power_law_1.2,2.0514816284179687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,1,32,power_law_1.2,2.6826751708984373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,1,32,power_law_1.2,2.697011184692383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,1,32,power_law_1.2,4.067091369628907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,1,32,power_law_1.2,5.354496002197266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,1,4,power_law_1.01,33.91549377441406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,1,32,power_law_1.2,8.085913848876952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,1,power_law_1.2,0.04567039906978607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,1,power_law_1.2,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,1,power_law_1.2,0.17674239873886108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,1,power_law_1.2,0.32727038860321045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,1,power_law_1.2,0.475545597076416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,1,power_law_1.2,0.6309887886047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,1,32,power_law_1.2,8.691506958007812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,1,power_law_1.2,0.9674752235412598
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,1,power_law_1.2,1.001471996307373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,1,power_law_1.2,1.0293248176574707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,1,power_law_1.2,1.0676223754882812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,1,power_law_1.2,1.1425791740417481
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,1,power_law_1.2,1.1565055847167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,1,power_law_1.2,1.1646976470947266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,1,power_law_1.2,1.2472319602966309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,1,power_law_1.2,1.2957695960998534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,1,power_law_1.2,1.3432831764221191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,1,power_law_1.2,1.384447956085205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,1,power_law_1.2,1.498521614074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,1,power_law_1.2,1.6123903274536133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,1,power_law_1.2,1.7973119735717773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,1,power_law_1.2,1.9134464263916016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,1,power_law_1.2,2.2691839218139647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,1,power_law_1.2,2.7480064392089845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,1,power_law_1.2,3.5516414642333984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,1,power_law_1.2,4.078591918945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,1,power_law_1.2,5.629747009277343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,1,power_law_1.2,7.137478637695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,16,power_law_1.01,0.8183808326721191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,16,power_law_1.01,1.072537612915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,16,power_law_1.01,1.0524288177490235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,16,power_law_1.01,1.072108840942383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,16,power_law_1.01,0.9699328422546387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,16,power_law_1.01,0.9262975692749024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,16,power_law_1.01,0.9136128425598145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,16,power_law_1.01,0.9576448440551758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,16,power_law_1.01,0.9822208404541015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,16,power_law_1.01,0.9672703742980957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,16,power_law_1.01,1.0061823844909668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,16,power_law_1.01,1.0008576393127442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,16,power_law_1.01,1.0199040412902831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,16,power_law_1.01,1.0459136009216308
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,16,power_law_1.01,1.0680319786071777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,16,power_law_1.01,1.0674176216125488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,16,power_law_1.01,1.115334415435791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,16,power_law_1.01,1.1374591827392577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,16,power_law_1.01,1.2132351875305176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,16,power_law_1.01,1.3637632369995116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,16,power_law_1.01,1.5599616050720215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,16,power_law_1.2,2.1606399536132814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,16,power_law_1.01,1.964646339416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,16,power_law_1.01,1.9982336044311524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,16,power_law_1.01,2.654003143310547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,16,power_law_1.01,3.118694305419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,16,power_law_1.01,4.815667343139649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,16,power_law_1.01,6.118399810791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,16,power_law_1.2,0.024371199309825897
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,16,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,16,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,16,power_law_1.2,0.02232320010662079
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,16,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,16,power_law_1.2,0.023552000522613525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,16,power_law_1.2,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,16,power_law_1.2,0.02396160066127777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,16,power_law_1.2,0.024352000653743745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,16,power_law_1.2,0.024352000653743745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,16,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,16,power_law_1.2,0.025600001215934753
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,16,power_law_1.2,0.02600319981575012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,16,power_law_1.2,0.027852800488471986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,16,power_law_1.2,0.02969599962234497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,16,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,16,power_law_1.2,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,16,power_law_1.2,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,16,power_law_1.2,0.047513601183891294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,16,power_law_1.2,0.059596800804138185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,16,power_law_1.2,0.07106559872627258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,16,power_law_1.2,0.09912319779396057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,16,power_law_1.2,0.14970879554748534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.07024639844894409
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.23468799591064454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.3477504014968872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.4591616153717041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.7411712169647217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.7976960182189942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.8091648101806641
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.8429311752319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.8626175880432129
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.908083152770996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.9107456207275391
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.9213631629943848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.951910400390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,1,power_law_1.01,1.0045439720153808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,1,power_law_1.01,1.0158080101013183
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,1,power_law_1.01,1.0522624015808106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,1,power_law_1.01,1.1528191566467285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,16,power_law_1.2,0.3026943922042847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,1,power_law_1.01,1.2783616065979004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,1,power_law_1.01,1.5335424423217774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,1,power_law_1.01,1.8059263229370117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,1,power_law_1.01,2.330009651184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,1,power_law_1.01,2.7643903732299804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,1,power_law_1.01,3.9006206512451174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,1,power_law_1.01,4.949811172485352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,1,power_law_1.01,7.226777648925781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,1,power_law_1.01,9.58013458251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,16,power_law_1.2,0.4384768009185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,16,2,power_law_1.2,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,16,2,power_law_1.2,0.0679744005203247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,16,2,power_law_1.2,0.20336639881134033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,16,power_law_1.2,0.6285312175750732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,16,2,power_law_1.2,0.3452928066253662
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,16,2,power_law_1.2,0.3915776014328003
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,16,2,power_law_1.2,0.5445312023162842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,16,2,power_law_1.2,0.7895040035247802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,16,2,power_law_1.2,0.8605695724487304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,16,2,power_law_1.2,0.848691177368164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,16,2,power_law_1.2,0.8271807670593262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,16,2,power_law_1.2,0.9051967620849609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,16,2,power_law_1.2,0.9654272079467774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,16,2,power_law_1.2,0.9902079582214356
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,16,2,power_law_1.2,1.0127360343933105
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,16,2,power_law_1.2,1.0414079666137694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,16,2,power_law_1.2,1.11144962310791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,16,2,power_law_1.2,1.1587519645690918
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,16,2,power_law_1.2,1.3320192337036132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,16,2,power_law_1.2,1.4792448043823243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,16,2,power_law_1.2,1.7313535690307618
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,16,2,power_law_1.2,1.8728960037231446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,16,2,power_law_1.2,2.529689598083496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,16,2,power_law_1.2,3.1279104232788084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,4,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,4,power_law_1.01,0.03112959861755371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,4,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,16,2,power_law_1.2,4.166041564941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,4,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,4,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,4,power_law_1.01,0.03891200125217438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,4,power_law_1.01,0.03951359987258911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,4,power_law_1.01,0.039315199851989745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,4,power_law_1.01,0.040140798687934874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,4,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,16,2,power_law_1.2,5.0907135009765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,4,power_law_1.01,0.042803201079368594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,4,power_law_1.01,0.04485119879245758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,4,power_law_1.01,0.04792320132255554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,4,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,4,power_law_1.01,0.061849600076675414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,4,power_law_1.01,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,4,power_law_1.01,0.08601599931716919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,4,power_law_1.01,0.18800640106201172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,4,power_law_1.01,0.22036480903625488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,16,2,power_law_1.2,7.321804809570312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,4,power_law_1.01,0.2648063898086548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,4,power_law_1.01,0.32624640464782717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,4,power_law_1.01,0.45506558418273924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,4,power_law_1.01,0.7018496036529541
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,4,power_law_1.01,1.0164223670959474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,4,power_law_1.01,1.2595199584960937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,16,2,power_law_1.2,9.077760314941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,16,1,power_law_1.2,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,16,1,power_law_1.2,0.06676480174064636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,16,1,power_law_1.2,0.1255295991897583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,4,power_law_1.01,2.105548858642578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,16,1,power_law_1.2,0.2293760061264038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,16,1,power_law_1.2,0.3274751901626587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,16,1,power_law_1.2,0.5697343826293946
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,4,power_law_1.01,2.754560089111328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,16,1,power_law_1.2,0.6152192115783691
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,16,1,power_law_1.2,0.6449151992797851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,16,1,power_law_1.2,0.6662144184112548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,16,1,power_law_1.2,0.6582272052764893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,16,1,power_law_1.2,0.7053311824798584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,16,1,power_law_1.2,0.729088020324707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,16,1,power_law_1.2,0.7469056129455567
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,16,1,power_law_1.2,0.7915328025817872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,16,1,power_law_1.2,0.8243200302124023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,16,1,power_law_1.2,0.8804351806640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,16,1,power_law_1.2,0.9195520401000976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,16,1,power_law_1.2,1.0507967948913575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,16,1,power_law_1.2,1.2639936447143554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,16,1,power_law_1.2,1.5781760215759277
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,16,1,power_law_1.2,1.7856512069702148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,16,1,power_law_1.2,2.355404853820801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,16,1,power_law_1.2,2.932326316833496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,16,1,power_law_1.2,4.0687614440917965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,16,1,power_law_1.2,5.3452800750732425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,16,power_law_1.2,0.828006362915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,16,1,power_law_1.2,7.8911491394042965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,16,1,power_law_1.2,10.436793518066406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,8,8,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,8,8,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,8,8,balanced,0.04437333345413208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,8,8,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,8,8,balanced,0.05717333157857259
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,8,8,balanced,0.2940586606661479
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,8,8,balanced,0.29713066418965656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,8,8,balanced,0.2930186589558919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,8,8,balanced,0.2945706645647685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,8,8,balanced,0.29576534032821655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,8,8,balanced,0.2998613317807515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,8,8,balanced,0.304639995098114
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,8,8,balanced,0.3078826665878296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,8,8,balanced,0.31539199749628705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,8,8,balanced,0.3252906600634257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,8,8,balanced,0.33160533507664997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,8,8,balanced,0.3449173370997111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,8,8,balanced,0.37802668412526447
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,8,8,balanced,0.40908801555633545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,8,8,balanced,0.48520533243815106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,8,8,balanced,0.5480106671651205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,8,8,balanced,0.6261759996414185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,8,8,balanced,0.7623679637908936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,8,8,balanced,1.1412479877471924
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,8,8,balanced,1.586517333984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,8,8,balanced,2.29529603322347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,8,8,balanced,2.964138666788737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,32,power_law_1.2,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,32,power_law_1.2,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,32,power_law_1.2,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,32,power_law_1.2,0.22671360969543458
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,32,power_law_1.2,0.22732799053192138
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,32,power_law_1.2,0.15912959575653077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,32,power_law_1.2,0.12677119970321654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,32,power_law_1.2,0.17715200185775756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,32,power_law_1.2,0.16752640008926392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,32,power_law_1.2,0.1802240014076233
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,32,power_law_1.2,0.19824639558792115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,32,power_law_1.2,0.18431999683380126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,32,power_law_1.2,0.2283519983291626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,32,power_law_1.2,0.2174976110458374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,32,power_law_1.2,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,32,power_law_1.2,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,32,power_law_1.2,0.2672640085220337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,32,power_law_1.2,0.27975680828094485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,32,power_law_1.2,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,32,power_law_1.2,0.3952640056610107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,32,power_law_1.2,0.44605441093444825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,32,power_law_1.2,0.6195199966430665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,32,power_law_1.2,0.7192575931549072
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,32,power_law_1.2,1.0270719528198242
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,32,power_law_1.2,1.4045184135437012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,32,power_law_1.2,2.4031232833862304
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,32,power_law_1.2,3.0040063858032227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,8,2,power_law_1.01,0.0626688003540039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,8,2,power_law_1.01,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,8,2,power_law_1.01,0.40468478202819824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,8,2,power_law_1.01,0.5695487976074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,8,2,power_law_1.01,0.7051263809204101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,8,2,power_law_1.01,1.158348846435547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,8,2,power_law_1.01,1.184768009185791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,8,2,power_law_1.01,1.25665283203125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,8,2,power_law_1.01,1.2806143760681152
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,8,2,power_law_1.01,1.3170687675476074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,8,2,power_law_1.01,1.3434880256652832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,8,2,power_law_1.01,1.3774847984313965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,8,2,power_law_1.01,1.3930496215820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,8,2,power_law_1.01,1.4069760322570801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,8,2,power_law_1.01,1.4929920196533204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,8,2,power_law_1.01,1.51592960357666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,8,2,power_law_1.01,1.5542271614074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,8,2,power_law_1.01,1.678335952758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,8,2,power_law_1.01,1.8345983505249024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,8,2,power_law_1.01,2.0178943634033204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,8,2,power_law_1.01,2.1542911529541016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,8,2,power_law_1.01,2.72936954498291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,8,2,power_law_1.01,3.2937984466552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,8,2,power_law_1.01,4.448255920410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,8,2,power_law_1.01,5.279334259033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,8,2,power_law_1.01,7.338188934326172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,8,2,power_law_1.01,10.205593872070313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,2,16,power_law_1.01,0.6100992202758789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,2,16,power_law_1.01,0.7270400047302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,2,16,power_law_1.01,0.7133183956146241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,2,16,power_law_1.01,0.7260159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,2,16,power_law_1.01,0.6047743797302246
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,2,16,power_law_1.01,0.6762432098388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,2,16,power_law_1.01,0.6768640041351318
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,2,16,power_law_1.01,0.7061503887176513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,2,16,power_law_1.01,0.7213056087493896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,2,16,power_law_1.01,0.6873087882995605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,2,16,power_law_1.01,0.6656000137329101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,2,16,power_law_1.01,0.7458816051483155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,2,16,power_law_1.01,0.7133183956146241
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,2,16,power_law_1.01,0.7520256042480469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,2,16,power_law_1.01,0.7729152202606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,2,16,power_law_1.01,0.7481344223022461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,2,16,power_law_1.01,0.7919616222381591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,2,16,power_law_1.01,0.8603648185729981
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,2,16,power_law_1.01,0.9410559654235839
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,2,16,power_law_1.01,0.9998335838317871
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,2,16,power_law_1.01,1.2926976203918457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,2,16,power_law_1.01,1.5638527870178223
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,2,16,power_law_1.01,1.7557504653930665
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,2,16,power_law_1.01,2.3666688919067385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,2,16,power_law_1.01,3.178495979309082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,2,16,power_law_1.01,4.243046569824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,2,16,power_law_1.01,6.391193771362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,16,1,power_law_1.01,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,16,1,power_law_1.01,0.058982402086257935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,16,1,power_law_1.01,0.05591040253639221
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,16,1,power_law_1.01,0.24104959964752198
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,16,1,power_law_1.01,0.24596478939056396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,16,1,power_law_1.01,0.24268798828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,16,1,power_law_1.01,0.2504703998565674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,16,1,power_law_1.01,0.25231359004974363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,16,1,power_law_1.01,0.26192638874053953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,16,1,power_law_1.01,0.263372802734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,16,1,power_law_1.01,0.26521599292755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,16,1,power_law_1.01,0.27054080963134763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,16,1,power_law_1.01,0.2791296005249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,16,1,power_law_1.01,0.27688961029052733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,16,1,power_law_1.01,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,16,1,power_law_1.01,0.2979840040206909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,16,1,power_law_1.01,0.32460799217224123
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,16,1,power_law_1.01,0.3659775972366333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,16,1,power_law_1.01,0.4225024223327637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,16,1,power_law_1.01,0.5421055793762207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,16,1,power_law_1.01,0.6379519939422608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,16,1,power_law_1.01,0.9803775787353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,16,1,power_law_1.01,1.286143970489502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,16,1,power_law_1.01,1.946009635925293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,16384,2,8,16,2,power_law_1.2,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,16384,2,8,16,2,power_law_1.2,0.1136512041091919
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,16384,2,8,16,2,power_law_1.2,0.1210368037223816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,16384,2,8,16,2,power_law_1.2,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,16384,2,8,16,2,power_law_1.2,0.24248321056365968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,16384,2,8,16,2,power_law_1.2,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,16384,2,8,16,2,power_law_1.2,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,16384,2,8,16,2,power_law_1.2,0.24678399562835693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,16384,2,8,16,2,power_law_1.2,0.2500607967376709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,16384,2,8,16,2,power_law_1.2,0.2521087884902954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,16384,2,8,16,2,power_law_1.2,0.25886719226837157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,16384,2,8,16,2,power_law_1.2,0.27197439670562745
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,16384,2,8,16,2,power_law_1.2,0.28098559379577637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,16384,2,8,16,2,power_law_1.2,0.28037118911743164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,16384,2,8,16,2,power_law_1.2,0.29450240135192873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,16384,2,8,16,2,power_law_1.2,0.318668794631958
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,16384,2,8,16,2,power_law_1.2,0.3319808006286621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,16384,2,8,16,2,power_law_1.2,0.46141438484191893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,1,64,power_law_1.2,0.3289088010787964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,1,64,power_law_1.2,0.294707202911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,16384,2,8,16,2,power_law_1.2,0.45032958984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,1,64,power_law_1.2,0.2942975997924805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,1,64,power_law_1.2,0.26828799247741697
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,1,64,power_law_1.2,0.2203455924987793
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,1,64,power_law_1.2,0.210534405708313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,1,64,power_law_1.2,0.27360000610351565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,1,64,power_law_1.2,0.27607040405273436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,16384,2,8,16,2,power_law_1.2,0.6424575805664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,1,64,power_law_1.2,0.30494720935821534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,1,64,power_law_1.2,0.2930624008178711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,1,64,power_law_1.2,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,1,64,power_law_1.2,0.2994175910949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,1,64,power_law_1.2,0.30248959064483644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,1,64,power_law_1.2,0.3090431928634644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,1,64,power_law_1.2,0.31989760398864747
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,1,64,power_law_1.2,0.31252479553222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,1,64,power_law_1.2,0.3379199981689453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,1,64,power_law_1.2,0.3999743938446045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,1,64,power_law_1.2,0.4626431941986084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,1,64,power_law_1.2,0.5560319900512696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,1,64,power_law_1.2,0.7260159969329834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,2,8,power_law_1.2,0.27299840450286866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,2,8,power_law_1.2,0.24412159919738768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,2,8,power_law_1.2,0.24555521011352538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,2,8,power_law_1.2,0.24576001167297362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,2,8,power_law_1.2,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,2,8,power_law_1.2,0.2506752014160156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,2,8,power_law_1.2,0.2531327962875366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,1,64,power_law_1.2,1.0797056198120116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,2,8,power_law_1.2,0.25598080158233644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,2,8,power_law_1.2,0.26109440326690675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,2,8,power_law_1.2,0.2719360113143921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,1,64,power_law_1.2,1.3410304069519043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,2,8,power_law_1.2,0.29982719421386717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,2,8,power_law_1.2,0.35489280223846437
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,2,8,power_law_1.2,0.3362816095352173
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,1,64,power_law_1.2,2.010316848754883
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,2,8,power_law_1.2,0.36577279567718507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,2,8,power_law_1.2,0.40427517890930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,1,64,power_law_1.2,2.7639808654785156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,2,8,power_law_1.2,0.5163008213043213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,16384,2,8,16,2,power_law_1.2,0.8781632423400879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,1,64,power_law_1.2,4.986880111694336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,2,8,power_law_1.2,0.6107135772705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,2,8,power_law_1.2,0.8017919540405274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,1,64,power_law_1.2,7.665459442138672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,2,8,power_law_1.2,1.0799103736877442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,16384,2,8,16,2,power_law_1.2,1.2673024177551269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,1,4,balanced,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,1,4,balanced,0.2839893301328023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,1,4,balanced,0.5527893304824829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,1,4,balanced,1.0637653668721516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,1,4,balanced,2.061994711558024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,1,4,balanced,4.048896153767903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,16,1,power_law_1.01,2.6812416076660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,1,4,balanced,6.053887685139974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,2,8,power_law_1.2,1.4905344009399415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,1,4,balanced,5.942101160685222
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,1,4,balanced,5.951658884684245
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,1,4,balanced,5.961557388305664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,2,8,power_law_1.2,1.8378496170043945
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,1,4,balanced,5.979306538899739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,1,4,balanced,5.995007832845052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,16384,2,8,16,2,power_law_1.2,1.5986687660217285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,1,4,balanced,6.012245178222656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,1,4,balanced,6.044330596923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,1,4,balanced,6.0752213795979815
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,1,4,balanced,6.105429331461589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,1,4,balanced,6.150485356648763
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,1,4,balanced,6.246741612752278
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,2,8,power_law_1.2,2.7586559295654296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,1,4,balanced,6.331392288208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,1,4,balanced,6.488063812255859
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,1,4,balanced,6.664192199707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,1,4,balanced,7.000405629475911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,2,8,power_law_1.2,3.3384449005126955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,1,4,balanced,7.334741592407227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,1,4,balanced,7.92251714070638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,1,4,balanced,8.354133605957031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,1,4,balanced,9.859413146972656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,1,4,balanced,11.785728454589844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,16384,2,8,16,2,power_law_1.2,2.0858688354492188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,16384,2,8,16,2,power_law_1.2,3.0093311309814452
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,2,power_law_1.2,0.05939199924468994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,2,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,2,power_law_1.2,0.38686718940734866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,2,power_law_1.2,0.6447103977203369
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,2,power_law_1.2,0.858521556854248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,16,1,power_law_1.01,4.081254577636718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,2,power_law_1.2,1.0369024276733398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,2,power_law_1.2,1.4360575675964355
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,2,power_law_1.2,1.5104000091552734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,2,power_law_1.2,1.592524814605713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,2,power_law_1.2,1.7305599212646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,2,power_law_1.2,1.6650239944458007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,2,power_law_1.2,1.6748544692993164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,2,8,power_law_1.2,5.540454483032226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,2,power_law_1.2,1.8108352661132812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,2,power_law_1.2,1.862246322631836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,2,power_law_1.2,1.9191808700561523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,2,power_law_1.2,1.985331153869629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,2,power_law_1.2,2.0535295486450194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,2,power_law_1.2,2.2206464767456056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,16,1,power_law_1.01,5.485363388061524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,2,power_law_1.2,2.2769664764404296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,2,power_law_1.2,2.5133056640625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,2,power_law_1.2,2.840780830383301
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,2,power_law_1.2,3.2018367767333986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,2,power_law_1.2,3.9966720581054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,2,power_law_1.2,5.302681732177734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,2,power_law_1.2,5.824307250976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,2,power_law_1.2,8.824422454833984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,1,balanced,1.0437973340352376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,1,balanced,2.043189366658529
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,1,balanced,4.058282534281413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,1,balanced,4.062549273173015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,1,balanced,4.07807985941569
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,2,power_law_1.2,10.902118682861328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,1,balanced,4.072959899902344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,1,balanced,4.10587724049886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,1,balanced,4.140373229980469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,1,balanced,4.227072079976399
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,1,balanced,4.23850663503011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,1,balanced,4.276394526163737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,1,balanced,4.305391947428386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,1,balanced,4.319914817810059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,1,balanced,4.368725458780925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,1,balanced,6.681770960489909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,2,8,power_law_1.2,6.980608367919922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,1,balanced,6.901248296101888
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,1,balanced,7.02122688293457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,1,balanced,9.678325017293295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,1,balanced,11.133584340413412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,1,balanced,13.277013142903646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,1,balanced,15.754411061604818
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,16384,2,8,16,2,power_law_1.2,4.623769760131836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,1,balanced,19.44166437784831
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,1,balanced,23.975082397460938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,1,balanced,30.789291381835938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,1,balanced,37.917338053385414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,1,balanced,50.83989461263021
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,1,balanced,63.7675526936849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,8,power_law_1.01,0.031539198756217954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,8,power_law_1.01,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,8,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,8,power_law_1.01,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,8,power_law_1.01,0.030105599761009218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,8,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,8,power_law_1.01,0.031948798894882204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,8,power_law_1.01,0.032767999172210696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,8,power_law_1.01,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,8,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,8,power_law_1.01,0.03543039858341217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,8,power_law_1.01,0.03768320083618164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,8,power_law_1.01,0.03973119854927063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,8,power_law_1.01,0.04362240135669708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,8,power_law_1.01,0.04526079893112182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,8,power_law_1.01,0.053862398862838744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,8,power_law_1.01,0.06635519862174988
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,8,power_law_1.01,0.08069120049476623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,8,power_law_1.01,0.11796480417251587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,8,power_law_1.01,0.20746240615844727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,8,power_law_1.01,0.30126080513000486
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,8,power_law_1.01,0.41205759048461915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,8,power_law_1.01,0.6387712001800537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,8,power_law_1.01,0.9238335609436035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,8,power_law_1.01,1.5030271530151367
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,2,8,power_law_1.2,10.603314971923828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,8,power_law_1.01,1.9445760726928711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,16384,2,8,16,2,power_law_1.2,5.483315277099609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,4,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,4,power_law_1.01,0.18984960317611693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,4,power_law_1.01,0.24698879718780517
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,4,power_law_1.01,0.33873920440673827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,4,power_law_1.01,0.36925439834594725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,4,power_law_1.01,0.44011521339416504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,4,power_law_1.01,0.5343232154846191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,4,power_law_1.01,0.5349376201629639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,4,power_law_1.01,0.5468160152435303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,4,power_law_1.01,0.5695487976074218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,4,power_law_1.01,0.5783552169799805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,4,power_law_1.01,0.6086656093597412
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,4,power_law_1.01,0.6051839828491211
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,2,8,power_law_1.2,13.535232543945312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,4,power_law_1.01,0.6565887928009033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,4,power_law_1.01,0.6680575847625733
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,4,power_law_1.01,0.6721536159515381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,4,power_law_1.01,0.6555647850036621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,4,power_law_1.01,0.7129087924957276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,4,power_law_1.01,0.719052791595459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,4,power_law_1.01,0.7870463848114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,4,power_law_1.01,0.8665087699890137
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,4,power_law_1.01,1.0618880271911622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,4,power_law_1.01,1.2009471893310546
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,4,power_law_1.01,1.5073280334472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,4,power_law_1.01,1.9382272720336915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,4,power_law_1.01,2.6474496841430666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,4,power_law_1.01,3.4158592224121094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,4,2,power_law_1.01,0.24432640075683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,4,2,power_law_1.01,0.4009984016418457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,4,2,power_law_1.01,0.4868095874786377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,4,2,power_law_1.01,0.7634943962097168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,4,2,power_law_1.01,1.0307583808898926
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,4,2,power_law_1.01,1.5378432273864746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,4,2,power_law_1.01,1.6177152633666991
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,4,2,power_law_1.01,1.7424383163452148
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,4,2,power_law_1.01,1.7833984375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,4,2,power_law_1.01,1.7772544860839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,4,2,power_law_1.01,1.8155519485473632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,4,2,power_law_1.01,1.9359743118286132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,4,2,power_law_1.01,1.9372032165527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,4,2,power_law_1.01,2.0314048767089843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,4,2,power_law_1.01,2.0324352264404295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,4,2,power_law_1.01,2.088960075378418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,4,2,power_law_1.01,2.1987327575683593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,4,2,power_law_1.01,2.395955276489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,4,2,power_law_1.01,2.569011116027832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,4,2,power_law_1.01,2.95731201171875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,4,2,power_law_1.01,3.3621952056884767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,4,2,power_law_1.01,4.069171142578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,256,4,2,balanced,0.05017599960168203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,256,4,2,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,256,4,2,balanced,0.2850133379300435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,256,4,2,balanced,0.5355519851048788
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,256,4,2,balanced,1.0238293011983235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,256,4,2,balanced,2.0032854080200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,4,2,power_law_1.01,4.5348865509033205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,256,4,2,balanced,2.010453383127848
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,256,4,2,balanced,2.0495306650797525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,256,4,2,balanced,2.059936046600342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,256,4,2,balanced,2.0654080708821616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,256,4,2,balanced,2.048170725504557
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,4,2,power_law_1.01,6.094233703613281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,256,4,2,balanced,2.0674559275309243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,256,4,2,balanced,2.082304000854492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,256,4,2,balanced,2.1067093213399253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,256,4,2,balanced,2.1300907135009766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,256,4,2,balanced,2.158069292704264
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,256,4,2,balanced,2.2043306032816568
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,4,2,power_law_1.01,7.256269073486328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,256,4,2,balanced,2.304170608520508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,256,4,2,balanced,2.3872853914896646
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,256,4,2,balanced,2.570751984914144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,256,4,2,balanced,2.7750399907430015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,256,4,2,balanced,3.184634526570638
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,4,2,power_law_1.01,10.045849609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,256,4,2,balanced,3.630762736002604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,256,4,2,balanced,4.384767850240071
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,256,4,2,balanced,5.248511950174968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,256,4,2,balanced,6.955349604288737
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,4,2,power_law_1.01,13.468057250976562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,256,4,2,balanced,9.014613469441732
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,16,power_law_1.01,0.8343551635742188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,16,power_law_1.01,1.065561580657959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,16,power_law_1.01,0.9945088386535644
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,16,power_law_1.01,1.044480037689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,16,power_law_1.01,0.9752511978149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,16,power_law_1.01,1.024409580230713
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,16,power_law_1.01,0.8978431701660157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,16,power_law_1.01,0.9545727729797363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,16,power_law_1.01,0.951296043395996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,16,power_law_1.01,0.9430912017822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,16,power_law_1.01,0.9760767936706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,16,power_law_1.01,0.9439231872558593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,16,power_law_1.01,0.961945629119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,16,power_law_1.01,1.0053631782531738
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,16,power_law_1.01,1.0448896408081054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,16,power_law_1.01,1.0385408401489258
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,16,power_law_1.01,1.110630416870117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,16,power_law_1.01,1.1020288467407227
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,16,power_law_1.01,1.2486656188964844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,16,power_law_1.01,1.3903871536254884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,16,power_law_1.01,1.5034367561340332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,16,power_law_1.01,1.7786880493164063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,16,power_law_1.01,2.1372928619384766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,16,power_law_1.01,2.870681571960449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,16,power_law_1.01,3.4031551361083983
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,16,power_law_1.01,5.263359832763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,16,power_law_1.01,6.438297271728516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,1,32,power_law_1.2,1.0479616165161132
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,1,32,power_law_1.2,1.0424320220947265
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,1,32,power_law_1.2,1.0024959564208984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,1,32,power_law_1.2,1.0530816078186036
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,1,32,power_law_1.2,0.9058239936828614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,1,32,power_law_1.2,0.8347647666931153
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,1,32,power_law_1.2,1.011507225036621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,64,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,64,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,64,balanced,0.04727466901143392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,64,balanced,0.052906667192777
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,64,balanced,0.05461333195368449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,64,balanced,0.0554666668176651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,64,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,64,balanced,0.05580799778302511
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,64,balanced,0.05597866574923197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,64,balanced,0.05614933371543884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,64,balanced,0.05629866818586985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,64,balanced,0.059562668204307556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,64,balanced,0.0595413347085317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,64,balanced,0.06144000093142191
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,64,balanced,0.06417066852251689
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,64,balanced,0.06585599978764851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,1,32,power_law_1.2,0.8822784423828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,64,balanced,0.07441066702206929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,64,balanced,0.10461866855621338
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,64,balanced,0.13687466581662497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,1,32,power_law_1.2,0.9865216255187989
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,1,32,power_law_1.2,0.9611264228820801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,1,32,power_law_1.2,0.9178879737854004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,1,32,power_law_1.2,0.9541631698608398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,64,balanced,0.22323199113210043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,64,balanced,0.24251733223597208
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,1,32,power_law_1.2,1.0297344207763672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,64,balanced,0.32614399989446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,1,32,power_law_1.2,1.0720895767211913
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,64,balanced,0.3404800097147624
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,1,32,power_law_1.2,1.1269696235656739
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,64,balanced,0.45653335253397626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,1,32,power_law_1.2,1.0520575523376465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,64,balanced,0.502613345781962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,1,32,power_law_1.2,1.1339776039123535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,64,balanced,0.7289173603057861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,1,32,power_law_1.2,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,64,balanced,0.9364480177561442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,1,32,power_law_1.2,1.274227237701416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,1,32,power_law_1.2,1.618124771118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,1,32,power_law_1.2,1.7176576614379884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,1,32,power_law_1.2,2.2538240432739256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,1,32,power_law_1.2,3.0662208557128907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,1,32,power_law_1.2,4.594073486328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,2688,1856,6,128,1,64,balanced,0.04369066655635834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,2688,1856,6,128,1,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,2688,1856,6,128,1,64,balanced,0.029343999922275543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,2688,1856,6,128,1,64,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,2688,1856,6,128,1,64,balanced,0.03019733230272929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,2688,1856,6,128,1,64,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,2688,1856,6,128,1,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,2688,1856,6,128,1,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,2688,1856,6,128,1,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,2688,1856,6,128,1,64,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,2688,1856,6,128,1,64,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,2688,1856,6,128,1,64,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,2688,1856,6,128,1,64,balanced,0.03225066761175791
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,2688,1856,6,128,1,64,balanced,0.03276800115903219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,2688,1856,6,128,1,64,balanced,0.034304000437259674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,2688,1856,6,128,1,64,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,2688,1856,6,128,1,64,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,2688,1856,6,128,1,64,balanced,0.03853866706291834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,2688,1856,6,128,1,64,balanced,0.039408000806967415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,2688,1856,6,128,1,64,balanced,0.04761599997679392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,2688,1856,6,128,1,64,balanced,0.050666665037473045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,2688,1856,6,128,1,64,balanced,0.07611733178297679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,1,32,power_law_1.2,5.405900955200195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,2688,1856,6,128,1,64,balanced,0.07301333546638489
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,2688,1856,6,128,1,64,balanced,0.1160533328851064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,2688,1856,6,128,1,64,balanced,0.14011733730634054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,2688,1856,6,128,1,64,balanced,0.2681173284848531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,2688,1856,6,128,1,64,balanced,0.3309066692988078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,1,32,power_law_1.2,7.039788818359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,1,32,power_law_1.2,11.108761596679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,2,16,power_law_1.2,0.35143680572509767
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,2,16,power_law_1.2,0.3389440059661865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,2,16,power_law_1.2,0.3627007961273193
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,2,16,power_law_1.2,0.3487744092941284
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,2,16,power_law_1.2,0.3190783977508545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,2,16,power_law_1.2,0.3520512104034424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,2,16,power_law_1.2,0.3477504014968872
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,2,16,power_law_1.2,0.36433920860290525
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,2,16,power_law_1.2,0.373145604133606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,2,16,power_law_1.2,0.38236160278320314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,2,16,power_law_1.2,0.3708928108215332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,2,16,power_law_1.2,0.3975167989730835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,2,16,power_law_1.2,0.3876863956451416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,2,16,power_law_1.2,0.40960001945495605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,2,16,power_law_1.2,0.41594882011413575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,2,16,power_law_1.2,0.41614718437194825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,2,16,power_law_1.2,0.43540477752685547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,2,16,power_law_1.2,0.4618239879608154
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,2,16,power_law_1.2,0.5115776062011719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,2,16,power_law_1.2,0.6187007904052735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,2,16,power_law_1.2,0.7477248191833497
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,2,16,power_law_1.2,0.9478143692016602
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,2,16,power_law_1.2,1.356595230102539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,2,16,power_law_1.2,2.4143871307373046
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,2,16,power_law_1.2,2.4774591445922853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,16,balanced,0.027136000494162243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,16,balanced,0.02712533374627431
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,16,balanced,0.027306665976842243
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,16,balanced,0.028160000840822857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,16,balanced,0.0310506671667099
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,16,balanced,0.031744000812371574
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,16,balanced,0.031914666295051575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,16,balanced,0.032255999743938446
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,16,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,16,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,16,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,16,balanced,0.03395200024048487
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,16,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,16,balanced,0.042837331692377724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,16,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,16,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,16,balanced,0.04966400067011515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,16,balanced,0.06058666606744131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,16,balanced,0.06877866884072621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,16,balanced,0.11281067132949829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,16,balanced,0.1474560002485911
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,16,balanced,0.2773333390553792
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,16,balanced,0.3717120091120402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,16,balanced,0.6007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,16,balanced,0.8159573078155518
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,2,16,power_law_1.2,3.8942718505859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,2,16,power_law_1.2,4.928710556030273
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,8,4,power_law_1.2,0.03051519989967346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,8,4,power_law_1.2,0.030720001459121703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,8,4,power_law_1.2,0.030924800038337707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,8,4,power_law_1.2,0.031744000315666196
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,8,4,power_law_1.2,0.03522560000419617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,8,4,power_law_1.2,0.03809280097484589
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,8,4,power_law_1.2,0.04116480052471161
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,8,4,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,8,4,power_law_1.2,0.03993600010871887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,8,4,power_law_1.2,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,8,4,power_law_1.2,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,8,2,power_law_1.2,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,8,2,power_law_1.2,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,8,2,power_law_1.2,0.18124799728393554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,8,2,power_law_1.2,0.27545599937438964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,8,2,power_law_1.2,0.27873280048370364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,8,2,power_law_1.2,0.2820096015930176
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,8,2,power_law_1.2,0.2842623949050903
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,8,2,power_law_1.2,0.2883584022521973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,8,4,power_law_1.2,0.046489599347114566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,8,2,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,8,4,power_law_1.2,0.048537600040435794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,8,4,power_law_1.2,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,8,2,power_law_1.2,0.2875391960144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,8,4,power_law_1.2,0.06471679806709289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,8,2,power_law_1.2,0.30167040824890134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,8,4,power_law_1.2,0.06656000018119812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,8,2,power_law_1.2,0.29367039203643797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,8,4,power_law_1.2,0.09707520008087159
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,8,2,power_law_1.2,0.2893824100494385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,8,4,power_law_1.2,0.19333120584487914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,8,4,power_law_1.2,0.22999041080474852
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,8,4,power_law_1.2,0.2742271900177002
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,8,2,power_law_1.2,0.32767999172210693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,8,4,power_law_1.2,0.3506175994873047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,8,2,power_law_1.2,0.32911360263824463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,8,2,power_law_1.2,0.36577279567718507
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,8,2,power_law_1.2,0.34364159107208253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,8,2,power_law_1.2,0.4583424091339111
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,8,4,power_law_1.2,0.4501503944396973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,8,2,power_law_1.2,0.4958208084106445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,8,4,power_law_1.2,0.6954880237579346
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,8,2,power_law_1.2,0.7548927783966064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,8,4,power_law_1.2,1.0571776390075684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,8,2,power_law_1.2,0.8085503578186035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,8,2,power_law_1.2,1.14584321975708
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,8,4,power_law_1.2,1.2435456275939942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,8,2,power_law_1.2,1.4413824081420898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,8,4,power_law_1.2,2.2632448196411135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,8,2,power_law_1.2,2.5870336532592773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,16,1,balanced,0.04471466441949209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,16,1,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,16,1,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,16,1,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,16,1,balanced,0.15240533153216043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,16,1,balanced,0.3566879828770955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,16,1,balanced,0.36181334654490155
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,16,1,balanced,0.36300798257191974
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,16,1,balanced,0.3693173329035441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,16,1,balanced,0.3720533450444539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,16,1,balanced,0.37836798032124835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,16,1,balanced,0.3860479990641276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,16,1,balanced,0.39185067017873126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,16,1,balanced,0.40533332029978436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,16,1,balanced,0.4164266586303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,16,1,balanced,0.4288853406906128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,128,power_law_1.01,0.24002559185028077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,16,1,balanced,0.45431466897328693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,16,1,balanced,0.5131946802139282
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,128,power_law_1.01,0.21729280948638915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,128,power_law_1.01,0.21688320636749267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,128,power_law_1.01,0.21746559143066407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,128,power_law_1.01,0.18513920307159423
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,16,1,balanced,0.5698560078938802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,16,1,balanced,0.6917119820912679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,128,power_law_1.01,0.22016000747680664
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,16,1,balanced,0.8529919783274332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,128,power_law_1.01,0.2209791898727417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,128,power_law_1.01,0.2209791898727417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,128,power_law_1.01,0.22300798892974855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,128,power_law_1.01,0.22282240390777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,16,1,balanced,1.2016639709472656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,128,power_law_1.01,0.19353599548339845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,16,1,balanced,1.5184213320414226
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,128,power_law_1.01,0.2279423952102661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,16,1,balanced,2.1306026776631675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,128,power_law_1.01,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,128,power_law_1.01,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,16,1,balanced,2.7450027465820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,128,power_law_1.01,0.23633921146392822
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,128,power_law_1.01,0.23982079029083253
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,128,power_law_1.01,0.2476032018661499
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,16,1,balanced,4.042240142822266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,128,power_law_1.01,0.22547199726104736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,128,power_law_1.01,0.3059711933135986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,128,power_law_1.01,0.34259839057922364
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,16,1,balanced,5.448869069417317
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,128,power_law_1.01,0.3903359889984131
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,128,power_law_1.01,0.5257215976715088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,128,power_law_1.01,0.6532991886138916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,128,power_law_1.01,0.9373696327209473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,128,power_law_1.01,1.4780415534973144
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,128,power_law_1.01,1.9916799545288086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,128,power_law_1.01,2.4168447494506835
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,2,4,power_law_1.01,0.8214528083801269
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,2,4,power_law_1.01,1.4653440475463868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,2,4,power_law_1.01,1.492582416534424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,2,4,power_law_1.01,1.9982336044311524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,2,4,power_law_1.01,2.752511978149414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,2,4,power_law_1.01,3.5272705078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,2,4,power_law_1.01,3.5852287292480467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,2,4,power_law_1.01,3.4056190490722655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,2,4,power_law_1.01,3.5827713012695312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,2,4,power_law_1.01,3.8266880035400392
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,2,4,power_law_1.01,3.6976638793945313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,2,4,power_law_1.01,3.765248107910156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,2,4,power_law_1.01,3.96124153137207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,2,4,power_law_1.01,3.951001739501953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,8,2,power_law_1.2,3.0963712692260743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,2,4,power_law_1.01,4.210073471069336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,2,4,power_law_1.01,4.138803100585937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,2,4,power_law_1.01,4.318412780761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,2,4,power_law_1.01,4.284620666503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,2,4,power_law_1.01,4.601651382446289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,2048,768,8,128,4,64,power_law_1.2,0.022732800245285033
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,2048,768,8,128,4,64,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,2,4,power_law_1.01,4.8297985076904295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,2048,768,8,128,4,64,power_law_1.2,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,2048,768,8,128,4,64,power_law_1.2,0.02170879989862442
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,2048,768,8,128,4,64,power_law_1.2,0.021887999773025513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,2048,768,8,128,4,64,power_law_1.2,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,2048,768,8,128,4,64,power_law_1.2,0.022937600314617158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,2048,768,8,128,4,64,power_law_1.2,0.022918400168418885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,2,4,power_law_1.01,5.310259246826172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,2048,768,8,128,4,64,power_law_1.2,0.02314240038394928
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,2048,768,8,128,4,64,power_law_1.2,0.023321600258350374
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,2048,768,8,128,4,64,power_law_1.2,0.023756800591945647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,2048,768,8,128,4,64,power_law_1.2,0.024332800507545473
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,2048,768,8,128,4,64,power_law_1.2,0.02457599937915802
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,2048,768,8,128,4,64,power_law_1.2,0.02539519965648651
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,2048,768,8,128,4,64,power_law_1.2,0.027033600211143493
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,2048,768,8,128,4,64,power_law_1.2,0.027647998929023743
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,2048,768,8,128,4,64,power_law_1.2,0.029286399483680725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,2,4,power_law_1.01,6.334239959716797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,2048,768,8,128,4,64,power_law_1.2,0.03297280073165894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,2048,768,8,128,4,64,power_law_1.2,0.03624959886074066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,2048,768,8,128,4,64,power_law_1.2,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,2048,768,8,128,4,64,power_law_1.2,0.057740801572799684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,2048,768,8,128,4,64,power_law_1.2,0.08560640215873719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,2,4,power_law_1.01,6.49889907836914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,2,4,power_law_1.01,8.544255828857422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,2048,768,8,128,4,64,power_law_1.2,0.11690239906311035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,2,4,power_law_1.01,9.838182067871093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,2048,768,8,128,4,64,power_law_1.2,0.23509759902954103
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,2,4,power_law_1.01,13.285990905761718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,8,4,power_law_1.2,3.1651840209960938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,2,4,power_law_1.01,17.53495635986328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,2048,768,8,128,4,64,power_law_1.2,0.30617599487304686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,8,2,power_law_1.2,5.3284862518310545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,2048,768,8,128,4,64,power_law_1.2,0.46141438484191893
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,16,2,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,16,2,power_law_1.01,0.03133440017700195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,16,2,power_law_1.01,0.03317759931087494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,16,2,power_law_1.01,0.03498240113258362
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,16,2,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,16,2,power_law_1.01,0.04444159865379334
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,16,2,power_law_1.01,0.04628480076789856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,16,2,power_law_1.01,0.04669440090656281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,16,2,power_law_1.01,0.04933120012283325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,16,2,power_law_1.01,0.04956159889698029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,16,2,power_law_1.01,0.05181440114974976
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,16,2,power_law_1.01,0.05529599785804749
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,16,2,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,16,2,power_law_1.01,0.06696959733963012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,16,2,power_law_1.01,0.078847998380661
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,16,2,power_law_1.01,0.09994239807128906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,16,2,power_law_1.01,0.1640447974205017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,16,2,power_law_1.01,0.22466559410095216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,16,2,power_law_1.01,0.2533056020736694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,16,2,power_law_1.01,0.3221503973007202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,16,2,power_law_1.01,0.42086400985717776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,16,2,power_law_1.01,0.637337589263916
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,16,2,power_law_1.01,0.9416704177856445
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,16,2,power_law_1.01,1.396326446533203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,16,2,power_law_1.01,1.9529535293579101
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,16,2,power_law_1.01,2.9440000534057615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,16,2,power_law_1.01,4.279500961303711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,2048,768,8,128,4,64,power_law_1.2,0.7079936027526855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,8,2,power_law_1.2,6.232268905639648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,4,power_law_1.01,0.33975679874420167
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,4,power_law_1.01,0.5040128231048584
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,4,power_law_1.01,0.5455872058868408
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,4,power_law_1.01,0.8185855865478515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,4,power_law_1.01,0.9730048179626465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,4,power_law_1.01,1.1405247688293456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,4,power_law_1.01,1.2206080436706543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,4,power_law_1.01,1.2304384231567382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,4,power_law_1.01,1.2519424438476563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,4,power_law_1.01,1.235148811340332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,4,power_law_1.01,1.2881919860839843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,4,power_law_1.01,1.3283328056335448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,4,power_law_1.01,1.325260829925537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,4,power_law_1.01,1.4467071533203124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,4,power_law_1.01,1.4082048416137696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,4,power_law_1.01,1.4841856002807616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,4,power_law_1.01,1.5161343574523927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,4,power_law_1.01,1.5912960052490235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,4,power_law_1.01,1.6871423721313477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,4,power_law_1.01,1.863475227355957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,4,power_law_1.01,1.986969566345215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,4,power_law_1.01,2.490163230895996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,4,power_law_1.01,2.692505645751953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,4,power_law_1.01,3.611033630371094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,4,power_law_1.01,4.535500717163086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,4,power_law_1.01,6.31541748046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,4,power_law_1.01,9.272319793701172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,2,balanced,0.07287466526031494
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,2,balanced,0.28296534220377606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,2,balanced,0.5345280170440674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,2,balanced,1.0337279637654622
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,2,balanced,2.0285439491271973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,2,balanced,4.0168107350667315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,2,balanced,4.031488100687663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,2,balanced,4.0383148193359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,2,balanced,4.052117347717285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,2,balanced,4.063061396280925
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,2,balanced,4.069375991821289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,2,balanced,4.092074712117513
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,2,power_law_1.01,0.0421887993812561
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,2,balanced,4.106922785441081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,2,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,2,power_law_1.01,0.046079999208450316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,2,balanced,4.141056060791016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,2,power_law_1.01,0.04915199875831604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,2,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,2,power_law_1.01,0.06328319907188415
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,2,balanced,4.176213264465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,2,power_law_1.01,0.07700480222702026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,2,power_law_1.01,0.08826879858970642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,2,balanced,4.2060801188151045
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,2,power_law_1.01,0.0946175992488861
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,2,power_law_1.01,0.09093120098114013
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,2,balanced,4.280319849650065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,2,power_law_1.01,0.12779519557952881
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,2,power_law_1.01,0.12636159658432006
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,2,power_law_1.01,0.15400960445404052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,2,balanced,4.503552118937175
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,2,power_law_1.01,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,2,power_law_1.01,0.20008959770202636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,2,balanced,4.620287895202637
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,2,power_law_1.01,0.19988479614257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,2,power_law_1.01,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,2,balanced,4.840448061625163
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,2,power_law_1.01,0.26152958869934084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,2,power_law_1.01,0.29306879043579104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,2,power_law_1.01,0.3579904079437256
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,2,power_law_1.01,0.41840639114379885
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,2,balanced,5.243893305460612
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,2,power_law_1.01,0.6623231887817382
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,2,power_law_1.01,0.9029631614685059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,2,balanced,5.613738377888997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,2,power_law_1.01,1.3868927955627441
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,2,power_law_1.01,1.8458623886108398
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,2,balanced,5.932373046875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,2,power_law_1.01,2.7977727890014648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,2,balanced,7.1654402414957685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,2,power_law_1.01,3.6147201538085936
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,2,balanced,8.182954788208008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,2,balanced,10.663082758585611
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,2,balanced,13.44494883219401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,2,balanced,0.8282453219095866
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,2,balanced,1.673898696899414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,2,balanced,2.90286922454834
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,2,balanced,5.881173451741536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,2,16,balanced,0.03498666733503342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,2,16,balanced,0.03497066597143809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,2,16,balanced,0.03532800078392029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,2,16,balanced,0.03583999971548716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,2,16,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,2,16,balanced,0.1976319948832194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,2,16,balanced,0.19660800695419312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,2,16,balanced,0.19848533471425375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,2,16,balanced,0.1996799906094869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,2,16,balanced,0.1996799906094869
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,2,16,balanced,0.20258132616678873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,2,16,balanced,0.20497065782546997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,2,16,balanced,0.20462934176127115
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,2,16,balanced,0.20682666699091592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,2,16,balanced,0.21282132466634116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,2,16,balanced,0.21657600005467734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,2,16,balanced,0.22152533133824667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,2,16,balanced,0.23636800050735474
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,2,16,balanced,0.24200532833735147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,2,16,balanced,0.2645333409309387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,2,16,balanced,0.29781333605448407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,2,balanced,11.22986094156901
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,2,16,balanced,0.3490133285522461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,2,16,balanced,0.39458131790161133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,2,16,balanced,0.4756480058034261
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,2,16,balanced,0.5587626695632935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,2,16,balanced,0.7912106513977051
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,2,16,balanced,1.062058687210083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,2,balanced,16.193706512451172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,2,balanced,16.223573048909504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,2,balanced,16.243712107340496
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,2,balanced,16.28586705525716
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,2,balanced,16.311295827229817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,2,balanced,16.367956797281902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,2,balanced,16.421376546223957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,2,balanced,16.4846928914388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,2,balanced,16.56098175048828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,2,balanced,16.654165903727215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,2,balanced,16.749226888020832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,2,balanced,16.905386606852215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,2,balanced,19.320480346679688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,2,balanced,17.8517328898112
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,2,balanced,20.608341217041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,2,balanced,17.63855489095052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,2,balanced,18.7325439453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,2,balanced,19.71063486735026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,2,balanced,22.446250915527344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,2,balanced,24.28057098388672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,2,balanced,32.529919942220054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,2,balanced,38.45256551106771
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,4,32,power_law_1.2,0.22259199619293213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,4,32,power_law_1.2,0.19988479614257812
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,4,32,power_law_1.2,0.16609280109405516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,4,32,power_law_1.2,0.16773120164871216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,4,32,power_law_1.2,0.07761920094490052
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,4,32,power_law_1.2,0.16814080476760865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,4,32,power_law_1.2,0.14663679599761964
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,4,32,power_law_1.2,0.20254719257354736
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,4,32,power_law_1.2,0.20234239101409912
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,4,32,power_law_1.2,0.17448960542678832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,4,32,power_law_1.2,0.15767680406570433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,4,32,power_law_1.2,0.18391040563583375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,4,32,power_law_1.2,0.21032960414886476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,4,32,power_law_1.2,0.19619840383529663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,4,32,power_law_1.2,0.22055680751800538
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,4,32,power_law_1.2,0.22958080768585204
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,4,32,power_law_1.2,0.22609920501708985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,4,32,power_law_1.2,0.2693120002746582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,4,32,power_law_1.2,0.2917952060699463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,4,32,power_law_1.2,0.4118527889251709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,4,32,power_law_1.2,0.5378047943115234
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,4,32,power_law_1.2,0.6883327960968018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,4,32,power_law_1.2,0.981599998474121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,4,32,power_law_1.2,1.5009663581848145
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,4,32,power_law_1.2,1.9355648040771485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,4,32,power_law_1.2,2.87392635345459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,4,64,balanced,0.020138667275508244
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,4,64,balanced,0.020479999482631683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,4,64,balanced,0.019626667102177937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,4,64,balanced,0.019786667078733444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,4,64,balanced,0.019968000551064808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,4,64,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,4,64,balanced,0.020992000897725422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,4,64,balanced,0.021333334346612293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,4,64,balanced,0.021333334346612293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,4,64,balanced,0.021674667795499165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,4,64,balanced,0.02218666672706604
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,4,64,balanced,0.02252800017595291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,4,64,balanced,0.022698665658632915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,4,64,balanced,0.02388266722361247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,4,64,balanced,0.027818667391935985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,4,64,balanced,0.027989332874615986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,4,64,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,4,64,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,4,64,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,4,64,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,4,64,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,4,64,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,4,64,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,4,64,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,4,64,balanced,0.0580266664425532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,4,64,balanced,0.10871466994285583
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,4,64,balanced,0.17134400208791098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,4,32,power_law_1.2,3.695820617675781
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,4,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,4,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,4,power_law_1.01,0.04216960072517395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,4,power_law_1.01,0.0657151997089386
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,4,power_law_1.01,0.1376255989074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,4,power_law_1.01,0.20213758945465088
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,4,power_law_1.01,0.22179839611053467
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,4,power_law_1.01,0.22712318897247313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,4,power_law_1.01,0.22876160144805907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,4,power_law_1.01,0.219321608543396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,4,power_law_1.01,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,4,power_law_1.01,0.24453120231628417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,4,power_law_1.01,0.23960959911346436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,4,power_law_1.01,0.2514944076538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,4,power_law_1.01,0.25268480777740476
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,4,power_law_1.01,0.2627583980560303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,4,power_law_1.01,0.26603519916534424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,4,power_law_1.01,0.2994175910949707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,4,power_law_1.01,0.31129601001739504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,4,power_law_1.01,0.38338561058044435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,4,power_law_1.01,0.465715217590332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,4,power_law_1.01,0.7110655784606934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,4,power_law_1.01,0.9113599777221679
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,4,power_law_1.01,1.273855972290039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,4096,1536,8,128,2,128,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,4096,1536,8,128,2,128,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,4096,1536,8,128,2,128,balanced,0.029525332152843475
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,4096,1536,8,128,2,128,balanced,0.029861333469549816
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,4096,1536,8,128,2,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,4096,1536,8,128,2,128,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,4096,1536,8,128,2,128,balanced,0.03089066594839096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,4096,1536,8,128,2,128,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,4096,1536,8,128,2,128,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,4096,1536,8,128,2,128,balanced,0.0315733328461647
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,4,power_law_1.01,1.7305599212646485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,4096,1536,8,128,2,128,balanced,0.03259733319282532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,4096,1536,8,128,2,128,balanced,0.03310933212439219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,4096,1536,8,128,2,128,balanced,0.03328000009059906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,4096,1536,8,128,2,128,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,4096,1536,8,128,2,128,balanced,0.03618133316437403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,4096,1536,8,128,2,128,balanced,0.036858665446440377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,4096,1536,8,128,2,128,balanced,0.03857066730658213
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,4096,1536,8,128,2,128,balanced,0.04113066693147024
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,4096,1536,8,128,2,128,balanced,0.04334933559099833
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,4096,1536,8,128,2,128,balanced,0.0481279989083608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,4096,1536,8,128,2,128,balanced,0.05358933409055074
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,4,power_law_1.01,2.7082752227783202
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,4096,1536,8,128,2,128,balanced,0.06774933139483134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,4096,1536,8,128,2,128,balanced,0.12970667084058127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,4096,1536,8,128,2,128,balanced,0.27357866366704303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,4096,1536,8,128,2,128,balanced,0.34833065668741864
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,4,power_law_1.01,3.424256134033203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,4096,1536,8,128,2,128,balanced,0.5565439860026041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,4096,1536,8,128,2,128,balanced,0.7343786557515463
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,256,power_law_1.2,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,256,power_law_1.2,0.050380802154541014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,256,power_law_1.2,0.05058559775352478
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,256,power_law_1.2,0.05139840245246887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,256,power_law_1.2,0.05242879986763001
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,256,power_law_1.2,0.05283839702606201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,256,power_law_1.2,0.05324800014495849
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,256,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,4096,2688,22,512,1,128,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,256,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,256,power_law_1.2,0.054067200422286986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,4096,2688,22,512,1,128,power_law_1.01,0.062054401636123656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,256,power_law_1.2,0.05509120225906372
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,256,power_law_1.2,0.0591871976852417
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,4096,2688,22,512,1,128,power_law_1.01,0.059385597705841064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,256,power_law_1.2,0.061440002918243405
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,256,power_law_1.2,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,4096,2688,22,512,1,128,power_law_1.01,0.05263360142707825
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,256,power_law_1.2,0.07536640167236328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,4096,2688,22,512,1,128,power_law_1.01,0.054681599140167236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,256,power_law_1.2,0.07741439938545228
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,4096,2688,22,512,1,128,power_law_1.01,0.05304319858551025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,4096,2688,22,512,1,128,power_law_1.01,0.05427200198173523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,256,power_law_1.2,0.10280959606170655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,4096,2688,22,512,1,128,power_law_1.01,0.05488640069961548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,256,power_law_1.2,0.1363968014717102
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,4096,2688,22,512,1,128,power_law_1.01,0.054476797580718994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,256,power_law_1.2,0.16874879598617554
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,4096,2688,22,512,1,128,power_law_1.01,0.056524801254272464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,4096,2688,22,512,1,128,power_law_1.01,0.056934398412704465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,256,power_law_1.2,0.2807807922363281
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,4096,2688,22,512,1,128,power_law_1.01,0.06164479851722717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,256,power_law_1.2,0.38051838874816896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,4096,2688,22,512,1,128,power_law_1.01,0.06574079990386963
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,4096,2688,22,512,1,128,power_law_1.01,0.07270399928092956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,256,power_law_1.2,0.5615615844726562
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,4096,2688,22,512,1,128,power_law_1.01,0.08929280042648316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,4096,2688,22,512,1,128,power_law_1.01,0.09479680061340331
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,256,power_law_1.2,0.7376895904541015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,4096,2688,22,512,1,128,power_law_1.01,0.13230079412460327
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,4096,2688,22,512,1,128,power_law_1.01,0.1837056040763855
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,256,power_law_1.2,1.0852352142333985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,4096,2688,22,512,1,128,power_law_1.01,0.21114881038665773
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,4096,2688,22,512,1,128,power_law_1.01,0.2879487991333008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,4096,2688,22,512,1,128,power_law_1.01,0.35161600112915037
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,256,power_law_1.2,1.6936960220336914
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,4096,2688,22,512,1,128,power_law_1.01,0.5224448204040527
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,4096,2688,22,512,1,128,power_law_1.01,0.5789696216583252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,256,power_law_1.2,2.653183937072754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,4096,2688,22,512,1,128,power_law_1.01,0.8566656112670898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,4096,2688,22,512,1,128,power_law_1.01,1.1599871635437011
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,4096,2688,22,512,1,128,power_law_1.01,1.7967103958129882
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,128,power_law_1.01,2.7064319610595704
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,4096,2688,22,512,1,256,power_law_1.2,3.93175048828125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,16384,2,8,4,4,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,16384,2,8,4,4,balanced,0.03976533313592275
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,16384,2,8,4,4,balanced,0.24729599555333456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,16384,2,8,4,4,balanced,0.24832000335057577
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,16384,2,8,4,4,balanced,0.24967465798060098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,16384,2,8,4,4,balanced,0.2510506709416707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,16384,2,8,4,4,balanced,0.2532426714897156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,16384,2,8,4,4,balanced,0.248799999554952
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,16384,2,8,4,4,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,16384,2,8,4,4,balanced,0.2524159948031108
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,16384,2,8,4,4,balanced,0.2606079975763957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,16384,2,8,4,4,balanced,0.26368000109990436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,16384,2,8,4,4,balanced,0.26641066869099933
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,16384,2,8,4,4,balanced,0.26826133330663043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,16384,2,8,4,4,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,16384,2,8,4,4,balanced,0.29337600866953534
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,16384,2,8,4,4,balanced,0.2805759906768799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,16384,2,8,4,4,balanced,0.3324586749076843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,16384,2,8,4,4,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,16384,2,8,4,4,balanced,0.4911786715189616
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,16384,2,8,4,4,balanced,0.5778773228327433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,16384,2,8,4,4,balanced,0.8495786984761556
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,16384,2,8,4,4,balanced,1.1327146689097087
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,16384,2,8,4,4,balanced,1.6766293843587239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,16384,2,8,4,4,balanced,2.245120048522949
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,16384,2,8,4,4,balanced,3.3960959116617837
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,16384,2,8,4,4,balanced,4.507477442423503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,2,power_law_1.01,0.06512640118598938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,2,power_law_1.01,0.29552640914916994
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,2,power_law_1.01,0.5439487934112549
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,2,power_law_1.01,0.7059328079223632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,2,power_law_1.01,1.0582015991210938
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,2,power_law_1.01,1.4843903541564942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,2,power_law_1.01,1.609721565246582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,2,power_law_1.01,2.185420799255371
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,2,power_law_1.01,2.1983104705810548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,2,power_law_1.01,2.244812774658203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,2,power_law_1.01,2.307481575012207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,2,power_law_1.01,2.4582143783569337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,2,power_law_1.01,2.5167871475219727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,2,power_law_1.01,2.510643196105957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,2,power_law_1.01,2.550374412536621
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,2,power_law_1.01,2.5405439376831054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,2,power_law_1.01,2.772991943359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,2,power_law_1.01,2.882559967041016
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,2,power_law_1.01,3.0763008117675783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,2,power_law_1.01,3.3230846405029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,2,power_law_1.01,3.544473648071289
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,2,power_law_1.01,3.993600082397461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,2,power_law_1.01,4.428595352172851
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,2,power_law_1.01,5.409587097167969
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,2,power_law_1.01,6.609101104736328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,2,power_law_1.01,8.866201782226563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,2,power_law_1.01,10.90355224609375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,4,64,balanced,0.050517335534095764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,4,64,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,4,64,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,4,64,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,4,64,balanced,0.05239466826121012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,4,64,balanced,0.05870933334032694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,4,64,balanced,0.05853866537412008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,4,64,balanced,0.05905066430568695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,4,64,balanced,0.059392000238100685
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,4,64,balanced,0.0653653343518575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,4,64,balanced,0.060415998101234436
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,4,64,balanced,0.06775466601053874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,4,64,balanced,0.0631466656923294
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,4,64,balanced,0.06963199873765309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,4,64,balanced,0.07338666419188182
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,4,64,balanced,0.07458133498827617
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,4,64,balanced,0.07867733140786488
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,4,64,balanced,0.12151466806729634
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,4,64,balanced,0.15291733543078104
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,4,64,balanced,0.19541333119074503
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,4,64,balanced,0.2198186715443929
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,4,64,balanced,0.2657279968261719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,4,64,balanced,0.31829333305358887
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,4,64,balanced,0.4345173438390096
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,4,64,balanced,0.5369173288345337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,4,64,balanced,0.7632213433583578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,4,64,balanced,1.030997355779012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,2,16,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,2,16,balanced,0.023893333971500397
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,2,16,balanced,0.02457600086927414
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,2,16,balanced,0.025429333249727886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,2,16,balanced,0.02679466704527537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,2,16,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,2,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,2,16,balanced,0.030037333567937214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,2,16,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,2,16,balanced,0.030207999050617218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,2,16,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,2,16,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,2,16,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,2,16,balanced,0.03222399950027466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,2,16,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,2,16,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,2,16,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,2,16,balanced,0.04454400142033895
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,2,16,balanced,0.04420266548792521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,2,16,balanced,0.06007466713587443
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,2,16,balanced,0.06363733112812042
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,2,16,balanced,0.0988159974416097
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,2,16,balanced,0.16449600458145142
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,2,16,balanced,0.2645333409309387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,2,16,balanced,0.3222186764081319
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,2,16,balanced,0.4775253136952718
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,2,16,balanced,0.6391466856002808
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,2,16,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,2,16,balanced,0.0365226666132609
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,2,16,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,2,16,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,2,16,balanced,0.1493333379427592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,2,16,balanced,0.3556533257166545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,2,16,balanced,0.3575466473897298
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,2,16,balanced,0.3548159996668498
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,2,16,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,2,16,balanced,0.35652267932891846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,2,16,balanced,0.3580586512883504
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,2,16,balanced,0.359935998916626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,2,16,balanced,0.36164267857869464
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,2,16,balanced,0.36505599816640216
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,2,16,balanced,0.3694933255513509
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,2,16,balanced,0.37170668443044025
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,2,16,balanced,0.37700267632802326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,2,16,balanced,0.39133866628011066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,2,16,balanced,0.40482131640116376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,2,16,balanced,0.40960001945495605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,2,16,balanced,0.4358826478322347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,2,16,balanced,0.48793598016103107
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,2,16,balanced,0.5205333232879639
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,2,16,balanced,0.6179840167363485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,2,16,balanced,0.6826666990915934
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,2,16,balanced,0.9530026912689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,2,16,balanced,1.2093439896901448
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,6144,2560,8,160,16,2,power_law_1.01,0.058976000547409056
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,6144,2560,8,160,16,2,power_law_1.01,0.06717439889907836
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,6144,2560,8,160,16,2,power_law_1.01,0.18821120262145996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,6144,2560,8,160,16,2,power_law_1.01,0.321727991104126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,6144,2560,8,160,16,2,power_law_1.01,0.39935998916625975
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,6144,2560,8,160,16,2,power_law_1.01,0.606169605255127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,6144,2560,8,160,16,2,power_law_1.01,0.6309887886047363
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,6144,2560,8,160,16,2,power_law_1.01,0.6561791896820068
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,6144,2560,8,160,16,2,power_law_1.01,0.6547135829925537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,6144,2560,8,160,16,2,power_law_1.01,0.6653952121734619
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,6144,2560,8,160,16,2,power_law_1.01,0.7301119804382324
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,6144,2560,8,160,16,2,power_law_1.01,0.7493247985839844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,6144,2560,8,160,16,2,power_law_1.01,0.7536448001861572
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,6144,2560,8,160,16,2,power_law_1.01,0.7655104160308838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,6144,2560,8,160,16,2,power_law_1.01,0.7817215919494629
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,6144,2560,8,160,16,2,power_law_1.01,0.828006362915039
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,6144,2560,8,160,16,2,power_law_1.01,0.8708095550537109
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,6144,2560,8,160,16,2,power_law_1.01,0.9500543594360351
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,6144,2560,8,160,16,2,power_law_1.01,1.042636775970459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,6144,2560,8,160,16,2,power_law_1.01,1.244979190826416
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,6144,2560,8,160,16,2,power_law_1.01,1.4647295951843262
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,6144,2560,8,160,16,2,power_law_1.01,1.937984085083008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,6144,2560,8,160,16,2,power_law_1.01,2.32857608795166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,6144,2560,8,160,16,2,power_law_1.01,3.3920703887939454
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,6144,2560,8,160,16,2,power_law_1.01,4.284620666503907
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,6144,2560,8,160,16,2,power_law_1.01,6.3518718719482425
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,6144,2560,8,160,16,2,power_law_1.01,8.211436462402343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,1,16,balanced,0.036687999963760376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,1,16,balanced,0.03669333209594091
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,1,16,balanced,0.037717332442601524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,1,16,balanced,0.03942399968703588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,1,16,balanced,0.16127999623616537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,1,16,balanced,0.370688001314799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,1,16,balanced,0.3722240130106608
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,1,16,balanced,0.36113067468007404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,1,16,balanced,0.36266668637593585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,1,16,balanced,0.36266668637593585
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,1,16,balanced,0.3648853302001953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,1,16,balanced,0.3672746817270915
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,1,16,balanced,0.3686399857203166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,1,16,balanced,0.3720533450444539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,1,16,balanced,0.3838133414586385
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,1,16,balanced,0.37905065218607586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,1,16,balanced,0.3860479990641276
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,1,16,balanced,0.4005546569824219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,1,16,balanced,0.4148906469345093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,1,16,balanced,0.4416853189468384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,1,16,balanced,0.46779731909434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,1,16,balanced,0.5201919873555502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,1,16,balanced,0.5766826470692953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,1,16,balanced,0.6727680365244547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,1,16,balanced,0.7906986872355143
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,32,2,power_law_1.2,0.05980160236358643
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,32,2,power_law_1.2,0.06430720090866089
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,1,16,balanced,1.0816853046417236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,32,2,power_law_1.2,0.0729088008403778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,32,2,power_law_1.2,0.13783040046691894
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,32,2,power_law_1.2,0.2260672092437744
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,32,2,power_law_1.2,0.28671998977661134
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,32,2,power_law_1.2,0.40673279762268066
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,1,16,balanced,1.4021973609924316
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,32,2,power_law_1.2,0.43581438064575195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,32,2,power_law_1.2,0.4427775859832764
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,32,2,power_law_1.2,0.45035519599914553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,32,2,power_law_1.2,0.4724736213684082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,32,2,power_law_1.2,0.4874239921569824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,32,2,power_law_1.2,0.5042175769805908
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,32,2,power_law_1.2,0.5513216018676758
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,32,2,power_law_1.2,0.5728256225585937
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,32,2,power_law_1.2,0.6090752124786377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,32,2,power_law_1.2,0.6672383785247803
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,32,2,power_law_1.2,0.7786496162414551
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,32,2,power_law_1.2,0.8796159744262695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,32,2,power_law_1.2,1.126195240020752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,32,2,power_law_1.2,1.408409595489502
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,32,2,power_law_1.2,1.965670394897461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,32,2,power_law_1.2,2.612211227416992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,32,2,power_law_1.2,3.4062335968017576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,32,2,power_law_1.2,5.227315139770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,32,2,power_law_1.2,6.755123138427734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,32,2,power_law_1.2,9.059942626953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,14336,2,8,1,1,power_law_1.01,1.0299391746520996
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,14336,2,8,1,1,power_law_1.01,1.7403903961181642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,14336,2,8,1,1,power_law_1.01,2.6603519439697267
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,14336,2,8,1,1,power_law_1.01,3.765856170654297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,14336,2,8,1,1,power_law_1.01,4.0796161651611325
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,14336,2,8,1,1,power_law_1.01,4.105587387084961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,14336,2,8,1,1,power_law_1.01,4.369203186035156
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,14336,2,8,1,1,power_law_1.01,4.844543838500977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,14336,2,8,1,1,power_law_1.01,4.9702911376953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,14336,2,8,1,1,power_law_1.01,5.2172798156738285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,14336,2,8,1,1,power_law_1.01,4.824063873291015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,14336,2,8,1,1,power_law_1.01,5.048697662353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,14336,2,8,1,1,power_law_1.01,5.31025276184082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,14336,2,8,1,1,power_law_1.01,6.177177429199219
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,14336,2,8,1,1,power_law_1.01,6.874713897705078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,14336,2,8,1,1,power_law_1.01,6.988595581054687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,14336,2,8,1,1,power_law_1.01,8.382259368896484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,14336,2,8,1,1,power_law_1.01,10.314752197265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,14336,2,8,1,1,power_law_1.01,11.606797027587891
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,14336,2,8,1,1,power_law_1.01,14.13201904296875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,14336,2,8,1,1,power_law_1.01,16.207872009277345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,1,1,power_law_1.2,1.6023551940917968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,1,1,power_law_1.2,2.8229631423950194
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,1,1,power_law_1.2,5.7221118927001955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,1,1,power_law_1.2,8.91637725830078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,1,power_law_1.01,0.4478975772857666
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,1,power_law_1.01,0.7622655868530274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,1,power_law_1.01,1.455718421936035
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,1,power_law_1.01,2.5081855773925783
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,1,1,power_law_1.2,12.881510925292968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,1,power_law_1.01,3.6847614288330077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,1,power_law_1.01,6.108364868164062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,14336,2,8,1,1,power_law_1.01,20.814028930664062
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,1,power_law_1.01,6.541311645507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,1,1,power_law_1.2,23.40167694091797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,1,power_law_1.01,6.803040313720703
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,1,power_law_1.01,6.887014770507813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,1,power_law_1.01,7.073177337646484
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,1,power_law_1.01,7.357023620605469
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,1,1,power_law_1.2,25.355059814453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1,4096,2688,22,512,4,4,power_law_1.2,0.4366335868835449
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,1,power_law_1.01,7.581696319580078
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2,4096,2688,22,512,4,4,power_law_1.2,0.5736447811126709
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4,4096,2688,22,512,4,4,power_law_1.2,0.7684095859527588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8,4096,2688,22,512,4,4,power_law_1.2,0.9879551887512207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,1,power_law_1.01,7.643341064453125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16,4096,2688,22,512,4,4,power_law_1.2,1.2034048080444335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,14336,2,8,1,1,power_law_1.01,24.748646545410157
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,32,4096,2688,22,512,4,4,power_law_1.2,1.9429311752319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,48,4096,2688,22,512,4,4,power_law_1.2,1.743052864074707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,1,power_law_1.01,7.875993347167968
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,1,1,power_law_1.2,26.4079345703125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,64,4096,2688,22,512,4,4,power_law_1.2,1.8411520004272461
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,4,4,power_law_1.2,1.7786880493164063
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,4,4,power_law_1.2,1.842790412902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,1,power_law_1.01,8.2302978515625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,4,4,power_law_1.2,1.8739200592041017
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,4,4,power_law_1.2,1.9662847518920898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,4,4,power_law_1.2,2.008678436279297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,1,power_law_1.01,8.436736297607421
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,4,4,power_law_1.2,2.148966407775879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,32,2,balanced,0.03958933303753535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,32,2,balanced,0.04061333338419596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,32,2,balanced,0.04249600072701772
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,32,2,balanced,0.04659200211366018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,32,2,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,32,2,balanced,0.18602667252222696
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,4,4,power_law_1.2,2.166374397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,32,2,balanced,0.187391996383667
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,32,2,balanced,0.1889280080795288
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,32,2,balanced,0.19063466787338257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,32,2,balanced,0.19165867567062378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,32,2,balanced,0.1950719952583313
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,32,2,balanced,0.19933867454528809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,32,2,balanced,0.20104533433914185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,32,2,balanced,0.212991992632548
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,32,2,balanced,0.22169599930445352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,4,4,power_law_1.2,2.2151168823242187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,32,2,balanced,0.22732800245285034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,1,power_law_1.01,8.700927734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,32,2,balanced,0.23449599742889404
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,80,4096,2688,22,512,1,1,power_law_1.2,27.030938720703126
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,32,2,balanced,0.26521599292755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,32,2,balanced,0.30702932675679523
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,32,2,balanced,0.3592533270517985
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,32,2,balanced,0.4179626703262329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,4,4,power_law_1.2,2.2747135162353516
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,32,2,balanced,0.6070613463719686
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,32,2,balanced,0.838485320409139
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,4,power_law_1.2,2.3326719284057615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,32,2,balanced,1.3134506543477376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,32,2,balanced,1.771008014678955
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,4,1,power_law_1.01,9.061785888671874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,4,power_law_1.2,2.4793088912963865
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,32,2,balanced,2.6842454274495444
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,4,power_law_1.2,2.7801599502563477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,14336,2,8,1,1,power_law_1.01,31.14700927734375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,32,2,balanced,3.6058454513549805
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,4,power_law_1.2,3.1748096466064455
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,4,1,power_law_1.01,9.383936309814453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,4,power_law_1.2,3.987865447998047
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,96,4096,2688,22,512,1,1,power_law_1.2,28.289434814453124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,4,1,power_law_1.01,9.954713439941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,4,power_law_1.2,4.364492797851563
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,4,power_law_1.2,5.372518539428711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,4,1,power_law_1.01,11.06329574584961
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,4,power_law_1.2,6.702899169921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,128,4096,2688,22,512,1,1,power_law_1.2,29.118875122070314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,4,1,power_law_1.01,13.153689575195312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,4,power_law_1.2,9.588326263427735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,4,1,power_law_1.01,14.379621887207032
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,160,4096,2688,22,512,1,1,power_law_1.2,29.850830078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,4,1,power_law_1.01,18.51084747314453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,4,power_law_1.2,12.626534271240235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,14336,2,8,1,1,power_law_1.01,37.9936767578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,192,4096,2688,22,512,1,1,power_law_1.2,30.969854736328124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,4,1,power_law_1.01,21.86792907714844
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,256,4096,2688,22,512,1,1,power_law_1.2,32.179815673828124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,4,1,power_law_1.01,30.077542114257813
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,320,4096,2688,22,512,1,1,power_law_1.2,33.27508544921875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,4,1,power_law_1.01,37.44460754394531
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,384,4096,2688,22,512,1,1,power_law_1.2,33.812686157226565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,512,4096,2688,22,512,1,1,power_law_1.2,34.856756591796874
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,8,1,power_law_1.01,0.04464640021324158
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,8,1,power_law_1.01,0.04935680031776428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,8,1,power_law_1.01,0.16650240421295165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,8,1,power_law_1.01,0.3463167905807495
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,8,1,power_law_1.01,0.5193727970123291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,8,1,power_law_1.01,0.6590144157409668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,8,1,power_law_1.01,0.9703424453735352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,8,1,power_law_1.01,1.0250240325927735
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,8,1,power_law_1.01,1.0536767959594726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,8,1,power_law_1.01,1.0760191917419433
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,8,1,power_law_1.01,1.0870783805847168
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,768,4096,2688,22,512,1,1,power_law_1.2,37.473690795898435
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,8,1,power_law_1.01,1.1522047996520997
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,8,1,power_law_1.01,1.1718655586242677
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,8,1,power_law_1.01,1.218560028076172
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,8,1,power_law_1.01,1.239039993286133
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,8,1,power_law_1.01,1.2697600364685058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,8,1,power_law_1.01,1.3346816062927247
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,8,1,power_law_1.01,1.4428159713745117
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,8,1,power_law_1.01,1.5278079986572266
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,8,1,power_law_1.01,1.7352703094482422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,8,1,power_law_1.01,1.9126272201538086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,8,1,power_law_1.01,2.3064191818237303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,8,1,power_law_1.01,2.6947519302368166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,8,1,power_law_1.01,3.584819030761719
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1024,4096,2688,22,512,1,1,power_law_1.2,37.566873168945314
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,8,1,power_law_1.01,4.35937271118164
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,8,1,power_law_1.01,6.196428680419922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,8,1,power_law_1.01,7.808396911621093
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,1536,4096,2688,22,512,1,1,power_law_1.2,40.514764404296876
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,14336,2,8,1,1,power_law_1.01,51.832818603515626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,2048,4096,2688,22,512,1,1,power_law_1.2,40.45762634277344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,6144,2560,8,160,8,2,power_law_1.01,0.04976640045642853
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,6144,2560,8,160,8,2,power_law_1.01,0.06983680129051209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,6144,2560,8,160,8,2,power_law_1.01,0.1896448016166687
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,6144,2560,8,160,8,2,power_law_1.01,0.3082240104675293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,6144,2560,8,160,8,2,power_law_1.01,0.3446784019470215
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,6144,2560,8,160,8,2,power_law_1.01,0.5677055835723877
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,6144,2560,8,160,8,2,power_law_1.01,0.5906432151794434
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,6144,2560,8,160,8,2,power_law_1.01,0.5976064205169678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,6144,2560,8,160,8,2,power_law_1.01,0.6490111827850342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,6144,2560,8,160,8,2,power_law_1.01,0.6524928092956543
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,6144,2560,8,160,8,2,power_law_1.01,0.6727680206298828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,3072,4096,2688,22,512,1,1,power_law_1.2,45.257318115234376
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,6144,2560,8,160,8,2,power_law_1.01,0.6887423992156982
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,6144,2560,8,160,8,2,power_law_1.01,0.7116799831390381
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,6144,2560,8,160,8,2,power_law_1.01,0.7133056163787842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,6144,2560,8,160,8,2,power_law_1.01,0.7614463806152344
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,6144,2560,8,160,8,2,power_law_1.01,0.7856128215789795
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,6144,2560,8,160,8,2,power_law_1.01,0.8458239555358886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,6144,2560,8,160,8,2,power_law_1.01,0.9156607627868653
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,6144,2560,8,160,8,2,power_law_1.01,1.004748821258545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,6144,2560,8,160,8,2,power_law_1.01,1.202995204925537
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,6144,2560,8,160,8,2,power_law_1.01,1.4125056266784668
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,6144,2560,8,160,8,2,power_law_1.01,1.8305023193359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,6144,2560,8,160,8,2,power_law_1.01,2.087321662902832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,6144,2560,8,160,8,2,power_law_1.01,2.8588031768798827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,6144,2560,8,160,8,2,power_law_1.01,3.785318374633789
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,6144,2560,8,160,8,2,power_law_1.01,5.4626304626464846
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,4096,4096,2688,22,512,1,1,power_law_1.2,48.009420776367186
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,6144,2560,8,160,8,2,power_law_1.01,7.192371368408203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,6144,4096,2688,22,512,1,1,power_law_1.2,58.39708251953125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,8192,4096,2688,22,512,1,1,power_law_1.2,69.14088745117188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,12288,4096,2688,22,512,1,1,power_law_1.2,90.1054443359375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,14336,2,8,1,1,power_law_1.01,64.5265380859375
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,4,balanced,0.02184533327817917
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,4,balanced,0.021503999829292297
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,4,balanced,0.023039999107519787
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,4,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,4,balanced,0.2321066657702128
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,4,balanced,0.23603200912475586
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,4,balanced,0.2367146611213684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,4,balanced,0.2373973329861959
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,4,balanced,0.2387626568476359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,4,balanced,0.2387626568476359
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,4,balanced,0.23756800095240274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,4,balanced,0.23961599667867026
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,4,balanced,0.2409813404083252
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,4,balanced,0.24593067169189453
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,4,balanced,0.2512213389078776
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,4,balanced,0.25446399052937824
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,4,balanced,0.2595840096473694
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,4,balanced,0.2691413362820943
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,4,balanced,0.28040534257888794
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,4,balanced,0.28996266921361286
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,4,balanced,0.31726932525634766
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,4,balanced,0.3802453279495239
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,4,balanced,0.4227413336435954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,4,balanced,0.5922133525212606
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,4,balanced,0.7927467028299967
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,4,balanced,1.245184024175008
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,4,balanced,1.6513546307881672
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,float16,16384,4096,2688,22,512,1,1,power_law_1.2,101.43621215820312
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,8,4,balanced,0.034474665919939675
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,8,4,balanced,0.03515733281771342
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,8,4,balanced,0.03601066768169403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,8,4,balanced,0.038058665891488395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,8,4,balanced,0.04386133452256521
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,8,4,balanced,0.2167466680208842
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,8,4,balanced,0.1960960030555725
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,8,4,balanced,0.19694934288660684
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,8,4,balanced,0.19830934206644693
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,8,4,balanced,0.19898666938145956
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,8,4,balanced,0.20104533433914185
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,8,4,balanced,0.20548266172409058
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,8,4,balanced,0.20837867259979248
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,8,4,balanced,0.21179733673731485
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,8,4,balanced,0.2177706758181254
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,8,4,balanced,0.22101332743962607
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,8,4,balanced,0.2307413419087728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,8,4,balanced,0.2513920068740845
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,8,4,balanced,0.2653866608937581
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,8,4,balanced,0.3041226665178935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,8,4,balanced,0.35037867228190106
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,8,4,balanced,0.4087466796239217
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,8,4,balanced,0.4833279848098755
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,8,4,balanced,0.679253339767456
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,8,4,balanced,0.8978772958119711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,8,4,balanced,1.4180693626403809
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,8,4,balanced,1.9665919939676921
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,2,2,power_law_1.2,0.6141632080078125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,2,2,power_law_1.2,1.0450943946838378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,2,2,power_law_1.2,1.6089088439941406
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,2,2,power_law_1.2,2.4596416473388674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,2,2,power_law_1.2,4.194099044799804
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,2,2,power_law_1.2,5.4611968994140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,384,8,8,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,384,8,8,balanced,0.05034666756788889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,384,8,8,balanced,0.05376000205675761
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,384,8,8,balanced,0.06689066688219707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,384,8,8,balanced,0.2757973273595174
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,2,2,power_law_1.2,6.266265487670898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,384,8,8,balanced,0.5434026718139648
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,384,8,8,balanced,0.797696034113566
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,8,8,balanced,0.7990612983703613
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,8,8,balanced,0.801093339920044
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,8,8,balanced,0.8029867013295492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,8,8,balanced,0.8053759733835856
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,8,8,balanced,0.8045226732889811
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,8,8,balanced,0.8065706888834635
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,8,8,balanced,0.8139093716939291
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,8,8,balanced,0.8231253623962402
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,384,2,2,power_law_1.2,8.397004699707031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,8,8,balanced,0.831658681233724
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,8,8,balanced,0.8526399930318197
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,8,8,balanced,0.8835413455963135
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,8,8,balanced,0.9239892959594727
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,8,8,balanced,0.9925973415374756
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,8,8,balanced,1.06222931543986
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,8,8,balanced,1.230847994486491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,8,8,balanced,1.407317320505778
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,384,2,2,power_law_1.2,8.751923370361329
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,8,8,balanced,1.7626454035441081
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,8,8,balanced,2.1087573369344077
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,8,8,balanced,2.8305066426595054
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,384,2,2,power_law_1.2,8.629657745361328
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,8,8,balanced,3.552586555480957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,384,2,2,power_law_1.2,9.079193878173829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,384,2,2,power_law_1.2,9.480397033691407
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,384,2,2,power_law_1.2,9.581158447265626
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,384,2,2,power_law_1.2,10.07941131591797
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,2048,768,8,128,2,1,balanced,0.02644266684850057
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,2048,768,8,128,2,1,balanced,0.03362133353948593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,2048,768,8,128,2,1,balanced,0.23481067021687826
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,2048,768,8,128,2,1,balanced,0.44697598616282147
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,2048,768,8,128,2,1,balanced,0.8726186752319336
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,2048,768,8,128,2,1,balanced,0.8777386347452799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,2048,768,8,128,2,1,balanced,0.8816586335500082
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,2048,768,8,128,2,1,balanced,0.8854186534881592
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,384,2,2,power_law_1.2,10.1285888671875
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,2048,768,8,128,2,1,balanced,0.8908639748891195
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,2048,768,8,128,2,1,balanced,0.8925866285959879
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,2048,768,8,128,2,1,balanced,0.9014613628387451
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,2048,768,8,128,2,1,balanced,0.9152746995290121
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,2048,768,8,128,2,1,balanced,0.9231359958648682
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,2048,768,8,128,2,1,balanced,0.9383253256479899
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,2048,768,8,128,2,1,balanced,0.973311980565389
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,2048,768,8,128,2,1,balanced,1.0016427040100098
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,2048,768,8,128,2,1,balanced,1.0170026620229085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,2048,768,8,128,2,1,balanced,1.043946663538615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,2048,768,8,128,2,1,balanced,1.0994346936543782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,384,2,2,power_law_1.2,10.22894058227539
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,2048,768,8,128,2,1,balanced,1.2153173287709553
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,2048,768,8,128,2,1,balanced,1.3410986264546711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,2048,768,8,128,2,1,balanced,1.611946741739909
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,2048,768,8,128,2,1,balanced,1.8662080764770508
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,2048,768,8,128,2,1,balanced,2.3983786900838218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,2048,768,8,128,2,1,balanced,3.0257492065429688
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,384,2,2,power_law_1.2,10.569932556152343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,2048,768,8,128,2,1,balanced,4.561578750610352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,2048,768,8,128,2,1,balanced,6.073514938354492
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,384,2,2,power_law_1.2,11.951718139648438
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,384,2,2,power_law_1.2,11.9385986328125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,384,2,2,power_law_1.2,12.773580932617188
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,384,2,2,power_law_1.2,13.34517822265625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,384,2,2,power_law_1.2,14.431642150878906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,384,2,2,power_law_1.2,16.961088562011717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,384,2,2,power_law_1.2,20.019795227050782
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,384,2,2,power_law_1.2,22.89171142578125
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,384,2,2,power_law_1.2,30.449868774414064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1,2688,1856,6,128,1,128,balanced,0.028330666323502857
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2,2688,1856,6,128,1,128,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4,2688,1856,6,128,1,128,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8,2688,1856,6,128,1,128,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16,2688,1856,6,128,1,128,balanced,0.02867199977238973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,32,2688,1856,6,128,1,128,balanced,0.029696000119050343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,48,2688,1856,6,128,1,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,64,2688,1856,6,128,1,128,balanced,0.029866665601730347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,80,2688,1856,6,128,1,128,balanced,0.03242666771014532
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,96,2688,1856,6,128,1,128,balanced,0.030378667016824085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,128,2688,1856,6,128,1,128,balanced,0.030720000465710957
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,160,2688,1856,6,128,1,128,balanced,0.031061333914597828
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,192,2688,1856,6,128,1,128,balanced,0.0314026673634847
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,256,2688,1856,6,128,1,128,balanced,0.032074667513370514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,320,2688,1856,6,128,1,128,balanced,0.0341333324710528
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,384,2688,1856,6,128,1,128,balanced,0.034645333886146545
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,512,2688,1856,6,128,1,128,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,768,2688,1856,6,128,1,128,balanced,0.03737599899371465
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1024,2688,1856,6,128,1,128,balanced,0.03874133278926214
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,1536,2688,1856,6,128,1,128,balanced,0.04248533149560293
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,2048,2688,1856,6,128,1,128,balanced,0.045738667249679565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,3072,2688,1856,6,128,1,128,balanced,0.054101333022117615
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,4096,2688,1856,6,128,1,128,balanced,0.062458669145902
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,6144,2688,1856,6,128,1,128,balanced,0.12731732924779257
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,8192,2688,1856,6,128,1,128,balanced,0.23534933725992838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,12288,2688,1856,6,128,1,128,balanced,0.3432106574376424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_nongated,fp8,16384,2688,1856,6,128,1,128,balanced,0.4805973370869954
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,384,2,2,power_law_1.2,30.84656677246094
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,32,8,power_law_1.01,0.035206401348114015
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,32,8,power_law_1.01,0.03399679958820343
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,32,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,32,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,32,8,power_law_1.01,0.033792001008987424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,32,8,power_law_1.01,0.03604480028152466
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,32,8,power_law_1.01,0.03663359880447388
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,32,8,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,32,8,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,32,8,power_law_1.01,0.037887999415397645
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,32,8,power_law_1.01,0.03932160139083862
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,32,8,power_law_1.01,0.04012160003185272
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,32,8,power_law_1.01,0.040345600247383116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,32,8,power_law_1.01,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,32,8,power_law_1.01,0.045849600434303285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,32,8,power_law_1.01,0.04894720017910004
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,32,8,power_law_1.01,0.051596802473068235
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,32,8,power_law_1.01,0.06082559823989868
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,32,8,power_law_1.01,0.06593279838562012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,32,8,power_law_1.01,0.08455680012702942
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,32,8,power_law_1.01,0.14724479913711547
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,32,8,power_law_1.01,0.2928639888763428
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,32,8,power_law_1.01,0.43724799156188965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,32,8,power_law_1.01,0.6993919849395752
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,32,8,power_law_1.01,0.961945629119873
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,32,8,power_law_1.01,1.5361791610717774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,2,8,power_law_1.01,0.3250175952911377
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,32,8,power_law_1.01,2.2411264419555663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,2,8,power_law_1.01,0.5443583965301514
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,2,8,power_law_1.01,1.0577919960021973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,2,8,power_law_1.01,0.9459712028503418
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,2,8,power_law_1.01,1.2339008331298829
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,2,8,power_law_1.01,1.3699071884155274
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,2,8,power_law_1.01,1.0041343688964843
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,2,8,power_law_1.01,1.125990390777588
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,2,8,power_law_1.01,1.2644351959228515
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,2,8,power_law_1.01,1.3082624435424806
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,2,8,power_law_1.01,1.2103679656982422
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,2,8,power_law_1.01,1.4635007858276368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,2,8,power_law_1.01,1.4272512435913085
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,2,8,power_law_1.01,1.3135871887207031
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,2,8,power_law_1.01,1.3725695610046387
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,2,8,power_law_1.01,1.4524415969848632
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,2,8,power_law_1.01,1.409830379486084
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,2,8,power_law_1.01,1.538047981262207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,2,8,power_law_1.01,1.5271936416625977
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,2,8,power_law_1.01,1.7098560333251953
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,2,8,power_law_1.01,1.7043455123901368
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,2,8,power_law_1.01,2.0490240097045898
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,2,8,power_law_1.01,2.2550527572631838
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,2,8,power_law_1.01,2.820076751708984
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,2,8,power_law_1.01,3.540582275390625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,2,8,power_law_1.01,4.813619232177734
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,2,8,power_law_1.01,5.951078414916992
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,3072,1536,8,256,4,32,balanced,0.03345066557327906
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,3072,1536,8,256,4,32,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,3072,1536,8,256,4,32,balanced,0.03379199902216593
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,3072,1536,8,256,4,32,balanced,0.0339626669883728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,3072,1536,8,256,4,32,balanced,0.03549866626660029
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,3072,1536,8,256,4,32,balanced,0.03925333420435587
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,3072,1536,8,256,4,32,balanced,0.040106666584809623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,3072,1536,8,256,4,32,balanced,0.04027733455101649
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,3072,1536,8,256,4,32,balanced,0.040789333482583366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,3072,1536,8,256,4,32,balanced,0.04095999896526337
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,3072,1536,8,256,4,32,balanced,0.04147200038035711
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,3072,1536,8,256,4,32,balanced,0.04266666869322459
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,3072,1536,8,256,4,32,balanced,0.043007999658584595
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,3072,1536,8,256,4,32,balanced,0.044031997521718345
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,3072,1536,8,256,4,32,balanced,0.04693333307902018
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,3072,1536,8,256,4,32,balanced,0.04744533201058706
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,3072,1536,8,256,4,32,balanced,0.051029334465662636
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,3072,1536,8,256,4,32,balanced,0.05819733440876007
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,3072,1536,8,256,4,32,balanced,0.06075733403364817
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,3072,1536,8,256,4,32,balanced,0.07508799930413564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,3072,1536,8,256,4,32,balanced,0.08191999793052673
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,3072,1536,8,256,4,32,balanced,0.1237333317597707
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,3072,1536,8,256,4,32,balanced,0.13004799683888754
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,3072,1536,8,256,4,32,balanced,0.2677759925524394
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,3072,1536,8,256,4,32,balanced,0.307370662689209
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,3072,1536,8,256,4,32,balanced,0.45721598466237384
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,3072,1536,8,256,4,32,balanced,0.5928959846496582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,8,4,balanced,0.028501334289709728
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,8,4,balanced,0.02918400118748347
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,8,4,balanced,0.031231999397277832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,8,4,balanced,0.036864000062147774
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,8,4,balanced,0.23637332518895468
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,8,4,balanced,0.23910399278004965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,8,4,balanced,0.2392746607462565
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,8,4,balanced,0.24115200837453207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,8,4,balanced,0.24132267634073892
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,8,4,balanced,0.24268800020217896
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,8,4,balanced,0.24490666389465332
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,8,4,balanced,0.2698240081469218
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,8,4,balanced,0.25036799907684326
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,8,4,balanced,0.253440002600352
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,8,4,balanced,0.2621440092722575
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,8,4,balanced,0.26521599292755127
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,8,4,balanced,0.27716267108917236
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,8,4,balanced,0.2836479942003886
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,8,4,balanced,0.30242133140563965
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,8,4,balanced,0.3524266481399536
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,8,4,balanced,0.37597866853078205
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,8,4,balanced,0.53111465771993
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,8,4,balanced,0.697002649307251
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,8,4,balanced,1.059658686319987
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,8,4,balanced,1.3963947296142578
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,4096,1536,8,128,8,4,balanced,2.1021013259887695
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,4096,1536,8,128,8,4,balanced,2.7397066752115884
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,7168,2048,8,384,4,8,power_law_1.2,0.05836799740791321
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,7168,2048,8,384,4,8,power_law_1.2,0.29183359146118165
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,7168,2048,8,384,4,8,power_law_1.2,0.4040703773498535
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,7168,2048,8,384,4,8,power_law_1.2,0.44564480781555177
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,7168,2048,8,384,4,8,power_law_1.2,0.628326416015625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,7168,2048,8,384,4,8,power_law_1.2,0.6864895820617676
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,7168,2048,8,384,4,8,power_law_1.2,0.7395199775695801
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,7168,2048,8,384,4,8,power_law_1.2,0.7045119762420654
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,7168,2048,8,384,4,8,power_law_1.2,0.6602752208709717
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,7168,2048,8,384,4,8,power_law_1.2,0.7077888011932373
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,7168,2048,8,384,4,8,power_law_1.2,0.6381247997283935
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,7168,2048,8,384,4,8,power_law_1.2,0.693452787399292
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,7168,2048,8,384,4,8,power_law_1.2,0.6674431800842285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,7168,2048,8,384,4,8,power_law_1.2,0.7186431884765625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,7168,2048,8,384,4,8,power_law_1.2,0.6832128047943116
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1,3072,1536,8,256,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2,3072,1536,8,256,4,64,power_law_1.01,0.03583999872207642
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,7168,2048,8,384,4,8,power_law_1.2,0.6785024166107178
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4,3072,1536,8,256,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,7168,2048,8,384,4,8,power_law_1.2,0.7731200218200683
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8,3072,1536,8,256,4,64,power_law_1.01,0.034406399726867674
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16,3072,1536,8,256,4,64,power_law_1.01,0.035020801424980166
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,7168,2048,8,384,4,8,power_law_1.2,0.8206336021423339
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,32,3072,1536,8,256,4,64,power_law_1.01,0.03563520014286041
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,7168,2048,8,384,4,8,power_law_1.2,0.8988672256469726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,48,3072,1536,8,256,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,64,3072,1536,8,256,4,64,power_law_1.01,0.0364544004201889
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,7168,2048,8,384,4,8,power_law_1.2,0.9981951713562012
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,80,3072,1536,8,256,4,64,power_law_1.01,0.03665919899940491
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,96,3072,1536,8,256,4,64,power_law_1.01,0.03686400055885315
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,7168,2048,8,384,4,8,power_law_1.2,1.057151985168457
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,128,3072,1536,8,256,4,64,power_law_1.01,0.037478399276733396
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,160,3072,1536,8,256,4,64,power_law_1.01,0.03870719969272614
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,7168,2048,8,384,4,8,power_law_1.2,1.305177593231201
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,192,3072,1536,8,256,4,64,power_law_1.01,0.03911679983139038
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,256,3072,1536,8,256,4,64,power_law_1.01,0.040550398826599124
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,320,3072,1536,8,256,4,64,power_law_1.01,0.04382719993591309
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,7168,2048,8,384,4,8,power_law_1.2,1.5861760139465333
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,384,3072,1536,8,256,4,64,power_law_1.01,0.04505600035190582
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,512,3072,1536,8,256,4,64,power_law_1.01,0.04730879962444305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,768,3072,1536,8,256,4,64,power_law_1.01,0.05550079941749573
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,7168,2048,8,384,4,8,power_law_1.2,1.9974143981933594
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1024,3072,1536,8,256,4,64,power_law_1.01,0.06492159962654113
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,1536,3072,1536,8,256,4,64,power_law_1.01,0.07557119727134705
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,2048,3072,1536,8,256,4,64,power_law_1.01,0.0954367995262146
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,3072,3072,1536,8,256,4,64,power_law_1.01,0.13148159980773927
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,7168,2048,8,384,4,8,power_law_1.2,2.740224075317383
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,4096,3072,1536,8,256,4,64,power_law_1.01,0.1662976026535034
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,6144,3072,1536,8,256,4,64,power_law_1.01,0.339353609085083
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,8192,3072,1536,8,256,4,64,power_law_1.01,0.4132863998413086
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,7168,2048,8,384,4,8,power_law_1.2,3.7617664337158203
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,12288,3072,1536,8,256,4,64,power_law_1.01,0.6135807991027832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,3072,1536,8,256,4,64,power_law_1.01,0.9170944213867187
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,fp8,16384,7168,2048,8,384,4,8,power_law_1.2,4.8175102233886715
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,4096,1536,8,128,2,16,power_law_1.2,0.23162879943847656
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1,7168,2048,8,256,8,8,power_law_1.01,0.06840320229530335
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,4096,1536,8,128,2,16,power_law_1.2,0.18350080251693726
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,4096,1536,8,128,2,16,power_law_1.2,0.18145279884338378
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2,7168,2048,8,256,8,8,power_law_1.01,0.2869247913360596
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,4096,1536,8,128,2,16,power_law_1.2,0.19517439603805542
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4,7168,2048,8,256,8,8,power_law_1.01,0.3493504047393799
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,4096,1536,8,128,2,16,power_law_1.2,0.09809920191764832
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,4096,1536,8,128,2,16,power_law_1.2,0.22302720546722413
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8,7168,2048,8,256,8,8,power_law_1.01,0.39915521144866944
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,4096,1536,8,128,2,16,power_law_1.2,0.22753279209136962
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,4096,1536,8,128,2,16,power_law_1.2,0.24412159919738768
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16,7168,2048,8,256,8,8,power_law_1.01,0.4175871849060059
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,4096,1536,8,128,2,16,power_law_1.2,0.23879680633544922
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,32,7168,2048,8,256,8,8,power_law_1.01,0.45752320289611814
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,4096,1536,8,128,2,16,power_law_1.2,0.2332672119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,4096,1536,8,128,2,16,power_law_1.2,0.24350719451904296
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,48,7168,2048,8,256,8,8,power_law_1.01,0.42741761207580564
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,4096,1536,8,128,2,16,power_law_1.2,0.24494080543518065
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,64,7168,2048,8,256,8,8,power_law_1.01,0.4501503944396973
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,4096,1536,8,128,2,16,power_law_1.2,0.2527231931686401
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,80,7168,2048,8,256,8,8,power_law_1.01,0.46284799575805663
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,4096,1536,8,128,2,16,power_law_1.2,0.2531327962875366
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,4096,1536,8,128,2,16,power_law_1.2,0.25436160564422605
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,96,7168,2048,8,256,8,8,power_law_1.01,0.5056511878967285
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,4096,1536,8,128,2,16,power_law_1.2,0.260096001625061
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,128,7168,2048,8,256,8,8,power_law_1.01,0.49049601554870603
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,4096,1536,8,128,2,16,power_law_1.2,0.28405759334564207
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,4096,1536,8,128,2,16,power_law_1.2,0.2875391960144043
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,160,7168,2048,8,256,8,8,power_law_1.01,0.48619518280029295
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,192,7168,2048,8,256,8,8,power_law_1.01,0.48762879371643064
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,4096,1536,8,128,2,16,power_law_1.2,0.32706561088562014
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,4096,1536,8,128,2,16,power_law_1.2,0.42024960517883303
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,256,7168,2048,8,256,8,8,power_law_1.01,0.5212160110473633
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,4096,1536,8,128,2,16,power_law_1.2,0.5079040050506591
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,320,7168,2048,8,256,8,8,power_law_1.01,0.5402624130249023
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,384,7168,2048,8,256,8,8,power_law_1.01,0.5666816234588623
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,512,7168,2048,8,256,8,8,power_law_1.01,0.5396480083465576
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,4096,1536,8,128,2,16,power_law_1.2,0.659660816192627
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,768,7168,2048,8,256,8,8,power_law_1.01,0.6135488033294678
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,4096,1536,8,128,2,16,power_law_1.2,0.8834943771362305
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1024,7168,2048,8,256,8,8,power_law_1.01,0.6362751960754395
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,1536,7168,2048,8,256,8,8,power_law_1.01,0.7532415866851807
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,2048,7168,2048,8,256,8,8,power_law_1.01,0.8288000106811524
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,3072,7168,2048,8,256,8,8,power_law_1.01,1.0172415733337403
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,4096,7168,2048,8,256,8,8,power_law_1.01,1.2627967834472655
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,7168,2048,8,256,8,8,power_law_1.01,1.7797119140625
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,6144,4096,1536,8,128,2,16,power_law_1.2,1.355776023864746
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,7168,2048,8,256,8,8,power_law_1.01,2.3339008331298827
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,12288,7168,2048,8,256,8,8,power_law_1.01,3.2050945281982424
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,16384,7168,2048,8,256,8,8,power_law_1.01,4.078796768188477
TRTLLM,1.2.0rc5,NVIDIA L40S,moe,moe_torch_flow_cutlass,float16,8192,4096,1536,8,128,2,16,power_law_1.2,1.9181568145751953
