framework,version,device,op_name,kernel_source,quant_type,num_token,hidden_size,intermediate_size,avg_ms
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,1,7168,2048,0.03152959942817688
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,2,7168,2048,0.030694401264190672
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,4,7168,2048,0.030112001299858093
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,8,7168,2048,0.02932479977607727
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,16,7168,2048,0.02876160144805908
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,32,7168,2048,0.030035200715065002
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,64,7168,2048,0.030243200063705445
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,128,7168,2048,0.03234240114688873
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,256,7168,2048,0.03817279934883118
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,512,7168,2048,0.054876798391342164
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,1024,7168,2048,0.0902783989906311
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,2048,7168,2048,0.16336640119552612
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,4096,7168,2048,0.2962975978851318
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,8192,7168,2048,0.5778687953948974
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,16384,7168,2048,1.129856014251709
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,32768,7168,2048,2.2135360717773436
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,65536,7168,2048,4.355340957641602
SGLang,0.5.8.post1,NVIDIA H100 80GB HBM3,mlp,deepseek_v3,fp8_block,131072,7168,2048,8.945289611816406
