framework,version,device,op_name,kernel_source,allreduce_dtype,num_gpus,message_size,latency,backend
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,128,0.0042835199832916265,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,128,0.021489601135253906,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,256,0.0042847999930381775,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,256,0.02131903886795044,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,512,0.004293760061264038,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,512,0.021304960250854495,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,1024,0.004275520145893097,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,1024,0.02111743927001953,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,2048,0.004317759871482849,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,2048,0.021187839508056642,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,4096,0.004423039853572845,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,4096,0.02122335910797119,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,8192,0.004440320134162902,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,8192,0.02100895881652832,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,16384,0.0044975998997688294,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,16384,0.02035520076751709,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,32768,0.004590719938278198,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,32768,0.02024928092956543,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,65536,0.004799039959907532,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,65536,0.02026144027709961,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,131072,0.005125439763069153,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,131072,0.020229759216308593,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,262144,0.006257280111312866,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,262144,0.021172161102294924,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,524288,0.008392959833145142,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,524288,0.020858240127563477,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,1048576,0.012450560331344604,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,1048576,0.02031327962875366,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,2097152,0.02027168035507202,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,2097152,0.027583999633789064,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,4194304,0.049983038902282714,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,4194304,0.05664351940155029,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,8388608,0.0784825611114502,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,8388608,0.09348223686218263,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,16777216,0.13817760467529297,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,16777216,0.1641663932800293,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,33554432,0.24680351257324218,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,33554432,0.2946368026733398,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,67108864,0.46512702941894535,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,67108864,0.5562406539916992,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,134217728,0.8842326354980468,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,134217728,1.0623958587646485,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,268435456,1.6891481018066408,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,268435456,2.038648376464844,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,2,536870912,3.2330221557617187,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,2,536870912,3.9174520874023435,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,128,0.004576640129089355,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,128,0.020132160186767577,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,256,0.004538879990577697,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,256,0.020291519165039063,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,512,0.004565120041370392,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,512,0.020087358951568605,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,1024,0.0045948800444602965,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,1024,0.019947199821472167,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,2048,0.00461984008550644,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,2048,0.020010879039764402,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,4096,0.004793600142002106,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,4096,0.019959360361099243,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,8192,0.004878399968147278,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,8192,0.020268480777740478,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,16384,0.004970239996910096,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,16384,0.01956928014755249,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,32768,0.00531328022480011,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,32768,0.019399679899215698,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,65536,0.0058351999521255495,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,65536,0.019571839570999144,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,131072,0.00709824025630951,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,131072,0.019519360065460206,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,262144,0.011358720064163209,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,262144,0.019457600116729735,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,524288,0.012800320386886596,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,524288,0.01988767981529236,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,1048576,0.01864351987838745,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,1048576,0.02578752040863037,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,2097152,0.03045439958572388,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,2097152,0.04435840129852295,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,4194304,0.06326464176177979,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,4194304,0.06982431888580323,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,8388608,0.10114368438720703,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,8388608,0.1148534393310547,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,16777216,0.17340127944946288,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,16777216,0.2001932716369629,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,33554432,0.3218758392333984,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,33554432,0.371130256652832,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,67108864,0.6104265594482422,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,67108864,0.7069683074951172,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,134217728,1.179632339477539,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,134217728,1.358419189453125,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,268435456,2.3131222534179687,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,268435456,2.667485656738281,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,4,536870912,4.533625183105469,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,4,536870912,5.239871826171875,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,128,0.004746879935264588,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,128,0.04086592197418213,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,256,0.004765760004520416,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,256,0.02100895881652832,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,512,0.0045526400208473206,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,512,0.021052160263061524,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,1024,0.004532159864902496,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,1024,0.0211244797706604,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,2048,0.004647360146045685,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,2048,0.021169919967651368,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,4096,0.004943999946117402,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,4096,0.02125920057296753,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,8192,0.005167999863624572,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,8192,0.02114016056060791,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,16384,0.005441280007362366,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,16384,0.021169281005859374,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,32768,0.00630847990512848,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,32768,0.021146559715270997,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,65536,0.0077203202247619635,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,65536,0.021362240314483645,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,131072,0.014709759950637818,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,131072,0.0261190390586853,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,262144,0.01558784008026123,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,262144,0.047951998710632326,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,524288,0.017256640195846558,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,524288,0.027434558868408204,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,1048576,0.020896000862121584,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,1048576,0.036097919940948485,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,2097152,0.03449408054351807,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,2097152,0.04335328102111816,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,4194304,0.07725759983062744,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,4194304,0.08153759956359863,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,8388608,0.1217529582977295,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,8388608,0.13970144271850587,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,16777216,0.21123935699462892,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,16777216,0.24104352951049807,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,33554432,0.36154464721679686,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,33554432,0.4109052658081055,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,67108864,0.6975468444824219,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,67108864,0.7845568084716797,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,134217728,1.3451005554199218,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,134217728,1.5257682800292969,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,268435456,2.6321661376953123,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,268435456,2.9897009277343747,vllm_eager
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_graph,float16,8,536870912,5.194132690429687,vllm_graph
vLLM,0.14.0,NVIDIA H100 80GB HBM3,all_reduce,vLLM_custom_eager,float16,8,536870912,5.909740600585938,vllm_eager
