framework,version,device,op_name,kernel_source,allreduce_dtype,num_gpus,message_size,latency,backend
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,128,0.006865599751472473,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,128,0.05142528057098389,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,256,0.007024319767951965,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,256,0.051682558059692386,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,512,0.0070191997289657596,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,512,0.050025920867919925,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,1024,0.007056319713592529,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,1024,0.04799520015716553,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,2048,0.006849600076675415,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,2048,0.049043521881103516,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,4096,0.0070304000377655025,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,4096,0.048411197662353515,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,8192,0.007024639844894409,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,8192,0.04782080173492432,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,16384,0.007024319767951965,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,16384,0.04728896141052246,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,32768,0.007048959732055664,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,32768,0.04763936042785645,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,65536,0.0074406397342681885,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,65536,0.05803391933441162,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,131072,0.00763264000415802,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,131072,0.057207679748535155,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,262144,0.009471039772033691,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,262144,0.048589439392089845,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,524288,0.013157440423965456,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,524288,0.04984992027282715,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,1048576,0.021022400856018066,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,1048576,0.04781119823455811,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,2097152,0.03520031929016113,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,2097152,0.04799488067626953,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,4194304,0.06324607849121093,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,4194304,0.07401631832122803,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,8388608,0.05624063968658447,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,8388608,0.14052127838134765,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,16777216,0.0830515193939209,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,16777216,0.11218079566955566,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,33554432,0.1509017562866211,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,33554432,0.17257919311523437,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,67108864,0.2781587219238281,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,67108864,0.3186908721923828,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,134217728,0.5203263854980469,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,134217728,0.6002195358276368,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,268435456,0.9630413055419922,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,268435456,1.125022430419922,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,2,536870912,1.8468293762207033,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,2,536870912,2.1620147705078123,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,128,0.007013440132141113,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,128,0.05613696098327636,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,256,0.007383040189743043,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,256,0.05005440235137939,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,512,0.007414079904556274,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,512,0.0480457592010498,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,1024,0.007406719923019408,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,1024,0.04801055908203125,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,2048,0.007048959732055664,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,2048,0.04548543930053711,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,4096,0.007523840069770813,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,4096,0.045223360061645505,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,8192,0.007419520020484923,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,8192,0.04525599956512451,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,16384,0.007433279752731323,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,16384,0.044870400428771974,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,32768,0.0076108801364898684,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,32768,0.045146241188049316,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,65536,0.008032640218734741,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,65536,0.044517440795898436,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,131072,0.008654720187187196,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,131072,0.04437535762786865,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,262144,0.018258559703826904,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,262144,0.04544191837310791,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,524288,0.01940287947654724,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,524288,0.04479807853698731,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,1048576,0.029377920627593996,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,1048576,0.046648321151733396,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,2097152,0.04638368129730225,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,2097152,0.05729856014251709,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,4194304,0.07874112129211426,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,4194304,0.08913599967956543,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,8388608,0.07685728073120117,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,8388608,0.10526816368103027,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,16777216,0.12292960166931152,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,16777216,0.13125311851501464,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,33554432,0.18308256149291993,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,33554432,0.20481311798095705,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,67108864,0.349615364074707,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,67108864,0.39116031646728516,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,134217728,0.6763827514648437,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,134217728,0.7559490966796875,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,268435456,1.3006591796875,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,268435456,1.4549990844726561,sglang_eager
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_graph,float16,4,536870912,2.5547640991210936,sglang_graph
SGLang,0.5.9,NVIDIA GB300,all_reduce,SGLang_CustomAllReduce_eager,float16,4,536870912,2.8646557617187502,sglang_eager
