framework,version,device,op_name,kernel_source,allreduce_dtype,num_gpus,message_size,latency,backend
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,128,0.006195200085639953,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,128,0.018498879671096802,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,256,0.006206719875335694,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,256,0.018422720432281495,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,512,0.006153600215911865,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,512,0.01840831995010376,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,1024,0.006179519891738892,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,1024,0.01856768012046814,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,2048,0.00658240020275116,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,2048,0.018389760255813598,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,4096,0.006416640281677247,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,4096,0.018645440340042112,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,8192,0.006593919992446899,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,8192,0.017954879999160768,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,16384,0.0068371200561523435,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,16384,0.017920000553131105,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,32768,0.007114560008049012,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,32768,0.03394752025604248,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,65536,0.0074169600009918206,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,65536,0.01830623984336853,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,131072,0.00753279983997345,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,131072,0.018362239599227906,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,262144,0.00944383978843689,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,262144,0.019939839839935303,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,524288,0.01351744055747986,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,524288,0.023418240547180176,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,1048576,0.021010239124298096,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,1048576,0.024808320999145508,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,2097152,0.0394540810585022,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,2097152,0.03995264053344726,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,4194304,0.04547264099121094,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,4194304,0.045923838615417475,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,8388608,0.05754591941833496,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,8388608,0.05945280075073243,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,16777216,0.08444448471069335,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,16777216,0.09672096252441406,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,33554432,0.1526252841949463,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,33554432,0.17513343811035156,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,67108864,0.2792755126953125,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,67108864,0.321860466003418,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,134217728,0.526032943725586,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,134217728,0.608575668334961,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,268435456,1.0029046630859375,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,268435456,1.1695410919189453,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,536870912,1.9070259094238282,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,536870912,2.232901153564453,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,128,0.007426880002021789,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,128,0.01965791940689087,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,256,0.007282559871673584,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,256,0.020254719257354736,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,512,0.007069439888000488,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,512,0.02047391891479492,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,1024,0.00713696002960205,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,1024,0.02020128011703491,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,2048,0.007410240173339844,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,2048,0.019608319997787477,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,4096,0.007370880246162415,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,4096,0.01963263988494873,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,8192,0.007521600127220154,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,8192,0.01916383981704712,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,16384,0.007804800271987915,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,16384,0.019081920385360718,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,32768,0.00800927996635437,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,32768,0.01929311990737915,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,65536,0.008003519773483276,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,65536,0.01922656059265137,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,131072,0.008414720296859742,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,131072,0.019587839841842654,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,262144,0.0179312002658844,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,262144,0.028250880241394043,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,524288,0.0187993597984314,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,524288,0.03026432037353516,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,1048576,0.026684160232543948,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,1048576,0.029560639858245853,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,2097152,0.03935679912567139,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,2097152,0.0420636796951294,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,4194304,0.053768639564514165,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,4194304,0.05206048011779785,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,8388608,0.08254912376403808,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,8388608,0.08044896125793458,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,16777216,0.1236790370941162,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,16777216,0.1344038391113281,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,33554432,0.18694656372070312,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,33554432,0.21075136184692383,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,67108864,0.3525894546508789,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,67108864,0.39588031768798826,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,134217728,0.6778566741943359,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,134217728,0.7609523010253907,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,268435456,1.2988079833984376,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,268435456,1.4669769287109375,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,536870912,2.527637786865234,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,536870912,2.8567645263671873,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,128,0.007244799733161926,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,128,0.01963104009628296,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,256,0.0071619200706481935,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,256,0.020186240673065188,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,512,0.006991040110588073,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,512,0.02018079996109009,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,1024,0.007041280269622803,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,1024,0.01894528031349182,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,2048,0.007406719923019408,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,2048,0.018863680362701415,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,4096,0.007519680261611939,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,4096,0.01926527976989746,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,8192,0.00782751977443695,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,8192,0.019362879991531374,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,16384,0.008115839958190919,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,16384,0.020252799987792967,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,32768,0.008632959723472595,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,32768,0.019585280418395995,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,65536,0.009413440227508545,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,65536,0.020013759136199953,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,131072,0.025461759567260746,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,131072,0.035606720447540284,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,262144,0.02571903944015503,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,262144,0.03636831998825073,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,524288,0.031100800037384035,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,524288,0.03323040008544922,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,1048576,0.03473056077957153,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,1048576,0.03723423957824707,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,2097152,0.05745408058166503,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,2097152,0.057390718460083014,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,4194304,0.07909984111785888,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,4194304,0.07486559867858886,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,8388608,0.1097548770904541,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,8388608,0.10686495780944824,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,16777216,0.1706617546081543,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,16777216,0.1765542411804199,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,33554432,0.2775353622436524,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,33554432,0.2882172775268555,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,67108864,0.39627201080322266,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,67108864,0.42362174987792967,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,134217728,0.713391342163086,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,134217728,0.7866019439697266,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,268435456,1.3390396118164063,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,268435456,1.5032421875000002,vllm_eager
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,536870912,2.6077416992187503,vllm_graph
vLLM,0.14.1.dev1+gd68209402,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,536870912,2.931562194824219,vllm_eager
