framework,version,device,op_name,kernel_source,allreduce_dtype,num_gpus,message_size,latency,backend
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,128,0.007102400064468384,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,128,0.02489664077758789,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,256,0.007404159903526305,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,256,0.02509471893310547,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,512,0.007319679856300354,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,512,0.02509023904800415,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,1024,0.007359359860420227,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,1024,0.02504447937011719,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,2048,0.007413759827613831,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,2048,0.024713919162750245,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,4096,0.007419520020484923,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,4096,0.02469183921813965,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,8192,0.007781440019607544,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,8192,0.02411263942718506,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,16384,0.007820159792900086,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,16384,0.024107201099395754,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,32768,0.008031039834022521,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,32768,0.02432703971862793,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,65536,0.008278719782829284,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,65536,0.024196479320526123,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,131072,0.008201919794082642,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,131072,0.024318718910217287,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,262144,0.010182080268859865,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,262144,0.023921918869018555,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,524288,0.014120960235595703,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,524288,0.025229759216308593,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,1048576,0.0229420804977417,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,1048576,0.031132481098175048,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,2097152,0.04132544040679932,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,2097152,0.04272480010986328,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,4194304,0.046166081428527836,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,4194304,0.04742368221282959,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,8388608,0.05978144168853759,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,8388608,0.06241024017333985,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,16777216,0.09088095664978027,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,16777216,0.10056447982788086,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,33554432,0.15880352020263672,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,33554432,0.1800041580200195,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,67108864,0.28843872070312504,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,67108864,0.32988609313964845,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,134217728,0.5391721725463867,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,134217728,0.6224009704589843,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,268435456,1.0294886779785155,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,268435456,1.2010374450683594,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,2,536870912,1.9823983764648438,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,2,536870912,2.3127037048339845,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,128,0.007661759853363037,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,128,0.025074241161346433,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,256,0.0074988800287246705,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,256,0.02513887882232666,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,512,0.007438719868659974,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,512,0.024822399616241456,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,1024,0.007412160038948059,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,1024,0.025046401023864746,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,2048,0.007671999931335449,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,2048,0.025143039226531983,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,4096,0.0076384001970291136,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,4096,0.024707839488983155,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,8192,0.007962239980697632,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,8192,0.024351680278778078,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,16384,0.008192960023880005,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,16384,0.024185919761657716,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,32768,0.008419200181961059,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,32768,0.03783360004425049,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,65536,0.008646399974822997,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,65536,0.024259519577026368,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,131072,0.00880735993385315,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,131072,0.024364800453186036,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,262144,0.01871808052062988,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,262144,0.02975775957107544,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,524288,0.01936735987663269,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,524288,0.031049599647521974,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,1048576,0.02758687973022461,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,1048576,0.03248447895050049,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,2097152,0.04209792137145996,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,2097152,0.04413568019866944,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,4194304,0.05604351997375488,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,4194304,0.05424511909484864,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,8388608,0.08633152008056641,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,8388608,0.08424415588378906,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,16777216,0.12701151847839356,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,16777216,0.13713248252868654,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,33554432,0.1913190460205078,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,33554432,0.21488319396972658,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,67108864,0.36170272827148436,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,67108864,0.4026780700683593,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,134217728,0.6922694396972656,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,134217728,0.775208969116211,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,268435456,1.3072857666015625,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,268435456,1.4750518798828125,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,4,536870912,2.559060516357422,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,4,536870912,2.8882464599609374,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,128,0.007565119862556457,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,128,0.02688256025314331,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,256,0.007387840151786803,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,256,0.0269596791267395,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,512,0.007372800111770631,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,512,0.027007360458374024,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,1024,0.0073788797855377205,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,1024,0.027080960273742676,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,2048,0.0076921600103378295,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,2048,0.027035839557647705,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,4096,0.007794240117073059,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,4096,0.026406400203704834,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,8192,0.008089280128479004,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,8192,0.025651199817657473,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,16384,0.008442559838294983,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,16384,0.02555583953857422,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,32768,0.008668479919433595,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,32768,0.025733439922332763,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,65536,0.00973695993423462,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,65536,0.02569439888000488,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,131072,0.026166720390319826,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,131072,0.03699039936065674,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,262144,0.02626879930496216,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,262144,0.03683487892150879,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,524288,0.03238464117050171,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,524288,0.03483328104019165,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,1048576,0.03591327905654908,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,1048576,0.0632419204711914,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,2097152,0.0582089614868164,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,2097152,0.05981056213378906,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,4194304,0.0815715217590332,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,4194304,0.07734111785888673,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,8388608,0.11181056022644043,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,8388608,0.11106559753417969,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,16777216,0.17298816680908202,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,16777216,0.18057056427001955,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,33554432,0.27964927673339846,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,33554432,0.29531871795654296,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,67108864,0.398702392578125,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,67108864,0.4385887908935547,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,134217728,0.7300204467773438,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,134217728,0.8135504150390626,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,268435456,1.3768301391601563,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,268435456,1.543873291015625,vllm_eager
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_graph,float16,8,536870912,2.6836126708984374,vllm_graph
vLLM,0.14.1,NVIDIA B200,all_reduce,vLLM_custom_eager,float16,8,536870912,3.0159564208984375,vllm_eager
