framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,1,1,power_law_1.01,0.1897318458557129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,1,1,power_law_1.01,0.30508031845092776
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,1,1,power_law_1.01,0.750271987915039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,1,1,power_law_1.01,0.38577152252197267
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,1,1,power_law_1.01,0.6910809326171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,1,1,power_law_1.01,0.7434438323974609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,1,1,power_law_1.01,0.7402668762207031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,1,1,power_law_1.01,0.6415711975097655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,1,1,power_law_1.01,0.6624556732177734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,1,1,power_law_1.01,0.6682733154296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,1,1,power_law_1.01,0.8073561859130859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,1,1,power_law_1.01,0.8391180419921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,1,1,power_law_1.01,0.9242694091796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,1,1,power_law_1.01,0.9693958282470703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,1,1,power_law_1.01,0.9929920196533203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,1,1,power_law_1.01,1.073450241088867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,1,1,power_law_1.01,1.0611360168457031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,1,1,power_law_1.01,1.4540992736816407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,1,1,power_law_1.01,1.7034342956542967
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,1,1,power_law_1.01,2.3290138244628906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,1,1,power_law_1.01,2.921536560058594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,1,1,power_law_1.01,4.16686279296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,1,1,power_law_1.01,7.66236328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,1,1,power_law_1.01,5.2342333984375005
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,1,1,power_law_1.01,10.564974365234374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,1,1,power_law_1.01,0.17527679443359373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,1,1,power_law_1.01,0.12133824348449707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,1,1,power_law_1.01,15.400571289062501
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,1,1,power_law_1.01,0.3621113586425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,1,1,power_law_1.01,0.35913150787353515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,1,1,power_law_1.01,0.21855167388916014
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,1,1,power_law_1.01,0.36209217071533206
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,1,1,power_law_1.01,0.3835366439819336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,1,1,power_law_1.01,0.35892288208007816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,1,1,power_law_1.01,0.3621644973754883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,1,1,power_law_1.01,0.4327321624755859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,1,1,power_law_1.01,19.967425537109374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,1,1,power_law_1.01,0.41059902191162106
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,1,1,power_law_1.01,0.36614017486572265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,1,1,power_law_1.01,0.47629760742187505
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,1,1,power_law_1.01,25.07781982421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,1,1,power_law_1.01,0.4860646438598633
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,1,1,power_law_1.01,0.4921292877197265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,1,1,power_law_1.01,0.5095840072631835
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,1,1,power_law_1.01,0.5395756912231445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,1,1,power_law_1.01,0.7482502746582032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.01,0.8588390350341797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.01,1.1999712371826172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.01,1.5845747375488282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,1,1,power_law_1.2,0.19704320907592773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,1,1,power_law_1.2,0.28178943634033204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,1,1,power_law_1.2,0.35083713531494143
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,1,1,power_law_1.2,0.6446765136718751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,1,1,power_law_1.2,0.6345209503173829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.01,2.2642451477050782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,1,1,power_law_1.2,0.6985311889648438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,1,1,power_law_1.2,0.6751443481445312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.01,2.8691384887695315
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,1,1,power_law_1.2,0.7425977325439452
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,1,1,power_law_1.2,0.7595513916015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,1,1,power_law_1.2,0.7705990600585937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,1,1,power_law_1.2,0.8177362823486328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,1,1,power_law_1.2,0.8440601348876953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.01,4.2165069580078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,1,1,power_law_1.2,0.9268070220947265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,1,1,power_law_1.2,0.9737535858154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,1,1,power_law_1.2,1.0250252532958986
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,1,1,power_law_1.2,1.099994888305664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,1,1,power_law_1.2,1.1113247680664062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.01,5.477184448242188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,1,1,power_law_1.2,1.4120101928710938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,1,1,power_law_1.2,1.7116601562500002
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,1,1,power_law_1.2,2.283504638671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.01,8.07083740234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,1,1,power_law_1.2,2.912207336425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,1,1,power_law_1.2,4.408550415039063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,1,1,power_law_1.2,5.418507690429688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.01,11.375684814453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,1,1,power_law_1.2,0.12690176010131834
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,1,1,power_law_1.2,0.17216447830200193
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,1,1,power_law_1.2,0.2044550323486328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,1,1,power_law_1.2,0.3641004943847656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,1,1,power_law_1.2,0.3445619201660156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,1,1,power_law_1.2,0.36643070220947266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,1,1,power_law_1.2,0.3631008148193359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,1,1,power_law_1.2,0.3595929718017578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,1,1,power_law_1.2,0.37067905426025394
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,1,1,power_law_1.2,8.067150268554688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,1,1,power_law_1.2,0.39553600311279297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.01,14.088546142578124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,1,1,power_law_1.2,0.4153567886352539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,1,1,power_law_1.2,0.43467647552490235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,1,1,power_law_1.2,0.47597824096679686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,1,1,power_law_1.2,0.49545665740966793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,1,1,power_law_1.2,0.5066592025756835
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,1,1,power_law_1.2,0.5324089431762695
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,1,1,power_law_1.2,0.5673696136474609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,1,1,power_law_1.2,0.7303981018066407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,1,1,power_law_1.2,0.8594226837158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,1,1,power_law_1.2,10.38735595703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,1,1,power_law_1.2,1.2246669006347655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,1,1,power_law_1.2,1.5998393249511718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,1,1,power_law_1.2,2.260728302001953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,1,1,power_law_1.2,2.908314208984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,1,1,power_law_1.2,4.232731628417969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,1,1,power_law_1.2,15.387486572265624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,1,1,power_law_1.2,5.5686883544921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,1,1,power_law_1.01,0.38873279571533204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,1,1,power_law_1.01,0.678094711303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,1,1,power_law_1.01,0.5293478393554688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,1,1,power_law_1.2,8.479889526367188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,1,1,power_law_1.2,20.326802978515623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,1,1,power_law_1.01,1.1372096252441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,1,1,power_law_1.01,1.7856370544433595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,1,1,power_law_1.2,11.209385986328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,1,1,power_law_1.01,1.8741427612304686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,1,1,power_law_1.01,1.9196691894531248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,1,1,power_law_1.01,1.817039337158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,1,1,power_law_1.01,1.8771705627441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,1,1,power_law_1.01,2.013317718505859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,1,1,power_law_1.01,2.097397766113281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,1,1,power_law_1.01,2.121267852783203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,1,1,power_law_1.01,2.3969503784179684
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,1,1,power_law_1.2,24.97411376953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,1,1,power_law_1.01,2.5115525817871096
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,1,1,power_law_1.01,2.5755181884765626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,1,1,power_law_1.2,14.018994140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,1,1,power_law_1.01,2.6851654052734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,1,1,power_law_1.01,3.3181280517578124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,1,1,power_law_1.01,4.341580200195312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,1,1,power_law_1.01,5.390703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,1,1,power_law_1.01,7.701162719726563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,1,1,power_law_1.01,10.195304565429687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,1,1,power_law_1.01,14.701671142578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,1,1,power_law_1.01,0.18935487747192384
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,1,1,power_law_1.01,0.3427257537841797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,1,1,power_law_1.01,0.27449792861938477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,1,1,power_law_1.01,0.6347270584106445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,1,1,power_law_1.01,19.356585693359374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,1,1,power_law_1.01,0.6401010894775391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,1,1,power_law_1.01,0.6450438690185547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,1,1,power_law_1.01,0.6384070587158204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,1,1,power_law_1.01,0.6428358459472656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,1,1,power_law_1.01,0.6523027038574218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,1,1,power_law_1.01,0.6655084991455078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,1,1,power_law_1.01,0.5841958236694336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,1,1,power_law_1.01,0.6595289611816406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,1,1,power_law_1.01,0.6870470428466797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,1,1,power_law_1.01,0.7028070068359374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,1,1,power_law_1.01,0.7217804718017578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,1,1,power_law_1.01,0.788023681640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,1,1,power_law_1.01,0.932666244506836
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,1,1,power_law_1.01,1.2263558197021485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.01,1.4063232421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.01,2.051294708251953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.01,2.5794464111328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.01,3.637790222167969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,1,1,power_law_1.01,30.633151855468746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.01,4.796965026855469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.01,7.167500610351563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.01,9.078754272460937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,1,1,power_law_1.2,0.40041217803955076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,1,1,power_law_1.2,0.47202625274658205
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,1,1,power_law_1.2,0.6189894485473633
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,1,1,power_law_1.2,1.1437567901611327
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,1,1,power_law_1.01,42.1446826171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,1,1,power_law_1.2,1.7144889831542969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.01,13.571286621093751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,1,1,power_law_1.2,1.817084197998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,1,1,power_law_1.2,1.8886483764648438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,1,1,power_law_1.2,1.8790969848632812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,1,1,power_law_1.2,1.9571603393554688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,1,1,power_law_1.2,2.0384326171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,1,1,power_law_1.2,2.10129150390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.01,17.965050048828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,1,1,power_law_1.2,2.158520965576172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,1,1,power_law_1.2,2.227626190185547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,1,1,power_law_1.2,2.5147801208496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,1,1,power_law_1.2,2.5738510131835937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,1,1,power_law_1.2,2.6730227661132813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,1,1,power_law_1.2,3.3003698730468747
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,1,1,power_law_1.2,4.472480773925781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.01,22.564924316406252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,1,1,power_law_1.2,5.387461547851562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,1,1,power_law_1.2,7.76549072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,1,1,power_law_1.2,10.098068237304688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,1,1,power_law_1.01,65.5248779296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,1,1,power_law_1.2,14.80975830078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,1,1,power_law_1.2,19.560194091796877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,1,1,power_law_1.2,0.20472448348999023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,1,1,power_law_1.2,0.24745792388916016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,1,1,power_law_1.2,0.31463232040405276
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,1,1,power_law_1.2,0.5844768142700195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,1,1,power_law_1.2,0.6139494323730469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,1,1,power_law_1.2,0.6436646270751953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,1,1,power_law_1.2,0.6478240203857422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,1,1,power_law_1.2,0.6414329528808593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,1,1,power_law_1.2,0.6578323364257812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,1,1,power_law_1.2,0.6594220733642577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,1,1,power_law_1.2,0.667041244506836
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,1,1,power_law_1.2,30.952976074218746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,1,1,power_law_1.2,0.6710105895996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,1,1,power_law_1.2,0.6742022705078126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,1,1,power_law_1.2,0.7134566497802735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,1,1,power_law_1.2,0.7320191955566406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,1,1,power_law_1.2,0.843544921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,1,1,power_law_1.2,0.9434464263916016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,1,1,power_law_1.01,89.931640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,1,1,power_law_1.2,1.242581787109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,1,1,power_law_1.2,1.4863040161132812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,1,1,power_law_1.2,2.038481903076172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,1,1,power_law_1.2,2.555167999267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,1,1,power_law_1.2,3.6998104858398433
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,1,1,power_law_1.2,4.790085144042969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,1,1,power_law_1.2,42.78185546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,1,1,power_law_1.2,7.119849853515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,1,1,power_law_1.2,9.187699584960937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,1,1,power_law_1.2,13.762640380859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,1,1,power_law_1.01,0.21807104110717773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,1,1,power_law_1.01,111.74120117187499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,1,1,power_law_1.2,18.09655517578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,1,1,power_law_1.01,0.4313375854492188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,1,1,power_law_1.01,1.034493408203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,1,1,power_law_1.2,22.457163085937502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,1,1,power_law_1.01,0.4823308944702148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,1,1,power_law_1.01,3.5155853271484374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,1,1,power_law_1.2,65.9290625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,1,1,power_law_1.01,1.729669189453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,1,1,power_law_1.01,3.6736651611328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,1,1,power_law_1.01,3.8280786132812503
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,1,1,power_law_1.01,2.4026457214355466
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,1,1,power_law_1.01,3.9302606201171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,1,1,power_law_1.01,4.16794189453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,1,1,power_law_1.01,4.424579772949219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,1,1,power_law_1.01,4.6187854003906255
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,1,1,power_law_1.01,5.080127868652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,1,1,power_law_1.01,7.220847778320312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,1,1,power_law_1.01,7.43389892578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,1,1,power_law_1.01,7.838791503906251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,1,1,power_law_1.01,8.999152221679688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,1,1,power_law_1.01,8.52210205078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,1,1,power_law_1.01,10.055189208984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,1,1,power_law_1.2,90.53865234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,1,1,power_law_1.01,11.278211669921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,1,1,power_law_1.01,13.380443115234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,1,1,power_law_1.01,15.733748779296874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,1,1,power_law_1.01,20.71794189453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,1,1,power_law_1.01,0.22644416809082032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,1,1,power_law_1.01,0.13978176116943358
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,1,1,power_law_1.01,25.719772949218747
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,1,1,power_law_1.01,0.2793996810913086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,1,1,power_law_1.01,0.5696633529663087
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,1,1,power_law_1.01,1.873272247314453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,1,1,power_law_1.2,114.175419921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,1,1,power_law_1.01,1.9519250488281252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,1,1,power_law_1.01,2.027937927246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,1,1,power_law_1.01,2.0845126342773437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,1,1,power_law_1.01,2.1747174072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,1,1,power_law_1.01,2.244427490234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,1,1,power_law_1.01,0.940200958251953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,1,1,power_law_1.01,36.123271484374996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,1,1,power_law_1.01,2.2937811279296874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,1,1,power_law_1.01,2.356078643798828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,1,1,power_law_1.01,1.28993408203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,1,1,power_law_1.01,2.6272799682617185
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,1,1,power_law_1.01,2.5909933471679687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,1,1,power_law_1.01,2.8352743530273434
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,1,1,power_law_1.01,2.723585205078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.01,3.5331103515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.01,2.948194580078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.01,3.2439099121093746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.01,4.213567504882812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,1,1,power_law_1.01,46.43181640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.01,4.9094213867187495
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.01,6.247000122070313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,1,1,power_law_1.2,0.4596051025390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.01,7.6850537109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,1,1,power_law_1.2,0.21893375396728515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,1,1,power_law_1.2,0.9346669006347657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,1,1,power_law_1.2,1.4996389770507812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,1,1,power_law_1.2,0.42577663421630857
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.01,11.043975830078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,1,1,power_law_1.01,56.791787109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,1,1,power_law_1.2,3.3980142211914064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,1,1,power_law_1.2,3.6328146362304685
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.01,13.979766845703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,1,1,power_law_1.2,3.7782055664062497
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,1,1,power_law_1.2,3.9169003295898435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,1,1,power_law_1.2,4.210261840820313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,1,1,power_law_1.2,4.504382019042969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.01,16.683931884765624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,1,1,power_law_1.2,2.1259014892578127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,1,1,power_law_1.2,4.785804138183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,1,1,power_law_1.2,5.275546264648438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,1,1,power_law_1.2,7.719931640625001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,1,1,power_law_1.2,8.131959838867187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,1,1,power_law_1.2,7.45855224609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,1,1,power_law_1.2,8.900945434570312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,1,1,power_law_1.2,9.508384399414062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,1,1,power_law_1.2,10.683718261718749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,1,1,power_law_1.2,11.298355712890626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,1,1,power_law_1.2,14.104876708984374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,1,1,power_law_1.2,0.22030464172363282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,1,1,power_law_1.2,0.25454528808593746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,1,1,power_law_1.2,0.516677131652832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,1,1,power_law_1.2,16.5275390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,1,1,power_law_1.2,0.1391744041442871
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,1,1,power_law_1.2,0.8175347137451172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,1,1,power_law_1.2,1.1418867492675782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,1,1,power_law_1.2,1.9305010986328124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,1,1,power_law_1.2,2.0010374450683592
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,1,1,power_law_1.2,21.32369873046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,1,1,power_law_1.2,2.058680267333984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,1,1,power_law_1.2,2.1653561401367187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,1,1,power_law_1.2,1.8134873962402345
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,1,1,power_law_1.2,2.312830047607422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,1,1,power_law_1.2,26.648068847656248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,1,1,power_law_1.2,2.4193177795410157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,1,1,power_law_1.2,2.7462283325195314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,1,1,power_law_1.2,2.827135314941406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,1,1,power_law_1.2,2.2529338073730467
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,1,1,power_law_1.2,3.0127713012695314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,1,1,power_law_1.2,2.6673074340820313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,1,1,power_law_1.2,3.152141418457031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,1,1,power_law_1.2,3.4694616699218748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,1,1,power_law_1.2,4.414496765136719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,1,1,power_law_1.2,36.972529296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,1,1,power_law_1.2,5.164537353515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,1,1,power_law_1.2,3.7317919921875005
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,1,1,power_law_1.2,6.470063476562499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,1,1,power_law_1.2,8.073661499023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,1,1,power_law_1.2,11.2725830078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,1,1,power_law_1.2,47.4785546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,1,1,power_law_1.01,0.043919358253479
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,1,1,power_law_1.01,0.05213056087493897
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,1,1,power_law_1.2,14.251114501953126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,1,1,power_law_1.01,0.08347455978393555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,1,1,power_law_1.01,0.27314432144165035
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,1,1,power_law_1.2,16.988542480468748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,1,1,power_law_1.01,0.2471897506713867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,1,1,power_law_1.01,0.3018182373046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,1,1,power_law_1.01,0.29634496688842776
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,1,1,power_law_1.01,0.2931404876708984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,1,1,power_law_1.01,0.12433535575866698
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,1,1,power_law_1.01,0.32131393432617184
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,1,1,power_law_1.01,0.1670604705810547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,1,1,power_law_1.01,0.3163430404663086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,1,1,power_law_1.01,0.3249926376342773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,1,1,power_law_1.2,58.02583984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,1,1,power_law_1.01,0.4255859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,1,1,power_law_1.01,0.35232574462890626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,1,1,power_law_1.01,0.478642578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,1,1,power_law_1.01,0.3837356948852539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,1,1,power_law_1.01,0.3516275024414063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,1,1,power_law_1.01,0.36350849151611325
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,1,1,power_law_1.01,0.3869670486450195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,1,1,power_law_1.01,0.7062822723388672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,1,1,power_law_1.01,0.8969945526123047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,1,1,power_law_1.01,1.199445114135742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,1,1,power_law_1.01,0.5653747177124023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,1,1,power_law_1.01,1.5226086425781251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,1,1,power_law_1.01,0.10466943740844728
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,1,1,power_law_1.01,0.15313088417053222
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,1,1,power_law_1.01,2.188629150390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,1,1,power_law_1.01,0.16849279403686523
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,1,1,power_law_1.01,0.17497472763061522
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,1,1,power_law_1.01,0.17873023986816405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,1,1,power_law_1.01,0.17945856094360352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,1,1,power_law_1.01,0.18510528564453127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,1,1,power_law_1.01,2.82525634765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,1,1,power_law_1.01,0.2110732841491699
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,1,1,power_law_1.01,0.21202432632446291
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,1,1,power_law_1.01,0.22024255752563476
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,1,1,power_law_1.01,0.22428096771240233
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,1,1,power_law_1.01,0.03562432050704956
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,1,1,power_law_1.01,0.22643199920654297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,1,1,power_law_1.01,3.443287048339844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,1,1,power_law_1.01,0.23803647994995117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,1,1,power_law_1.01,0.08337151527404785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,1,1,power_law_1.01,0.25372991561889646
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,1,1,power_law_1.01,0.27411264419555664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,1,1,power_law_1.01,0.3155724716186524
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,1,1,power_law_1.01,0.3718489456176758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,1,1,power_law_1.01,0.47010944366455076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,1,1,power_law_1.01,0.04293439865112304
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,1,1,power_law_1.01,0.5670355224609376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,1,1,power_law_1.01,0.8001734161376953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,1,1,power_law_1.01,1.0229708862304687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,1,1,power_law_1.2,0.07371903896331787
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,1,1,power_law_1.01,1.4587936401367188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,1,1,power_law_1.01,1.9087117004394532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,1,1,power_law_1.01,0.06441664218902587
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,1,1,power_law_1.01,2.3670162963867187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,1,1,power_law_1.2,0.046774401664733886
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,1,1,power_law_1.2,0.29033536911010743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,1,1,power_law_1.2,0.3094572830200195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,1,1,power_law_1.2,0.32154945373535154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,1,1,power_law_1.2,0.2528492736816406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,1,1,power_law_1.2,0.33445953369140624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,1,1,power_law_1.2,0.1448639965057373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,1,1,power_law_1.2,0.04263423919677735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,1,1,power_law_1.2,0.27993600845336913
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,1,1,power_law_1.2,0.10774847984313965
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,1,1,power_law_1.2,0.2979340744018555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,1,1,power_law_1.2,0.3024646377563477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,1,1,power_law_1.2,0.43466625213623045
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,1,1,power_law_1.2,0.4997734451293946
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,1,1,power_law_1.2,0.3544025421142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,1,1,power_law_1.2,0.3854751968383789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,1,1,power_law_1.2,0.5724499130249023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,1,1,power_law_1.2,0.7359986877441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,1,1,power_law_1.2,0.8892192077636718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,1,1,power_law_1.2,0.3539379119873047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,1,1,power_law_1.2,1.179401626586914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,1,1,power_law_1.2,0.369667854309082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,1,1,power_law_1.2,0.04239232063293457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,1,1,power_law_1.2,0.05921984195709229
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,1,1,power_law_1.2,1.5537542724609374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,1,1,power_law_1.2,0.3897260665893555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,1,1,power_law_1.2,0.07720831871032716
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,1,1,power_law_1.2,0.09835647583007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,1,1,power_law_1.2,0.15691264152526857
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,1,1,power_law_1.2,0.17077312469482422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,1,1,power_law_1.2,0.17663040161132812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,1,1,power_law_1.2,0.1802105522155762
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,1,1,power_law_1.2,2.1802828979492186
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,1,1,power_law_1.2,0.18135040283203124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,1,1,power_law_1.2,0.18578176498413085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,1,1,power_law_1.2,0.2144339179992676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,1,1,power_law_1.2,0.21364095687866208
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,1,1,power_law_1.2,0.2231782341003418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,1,1,power_law_1.2,0.22832767486572267
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,1,1,power_law_1.2,0.23127168655395508
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,1,1,power_law_1.2,0.24361663818359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,1,1,power_law_1.2,0.25512256622314455
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,1,1,power_law_1.2,2.8660910034179685
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,1,1,power_law_1.2,0.2805747222900391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,1,1,power_law_1.2,0.32752769470214843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,1,1,power_law_1.2,0.37476287841796874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,1,1,power_law_1.2,3.4529010009765626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,1,1,power_law_1.2,0.47256961822509763
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,1,1,power_law_1.2,0.5770016098022461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,1,1,power_law_1.2,0.8042495727539063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,1,1,power_law_1.2,1.0127251434326172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,1,1,power_law_1.01,0.1307161617279053
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,1,1,power_law_1.01,0.25850496292114256
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,1,1,power_law_1.01,0.4108243179321289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,1,1,power_law_1.2,1.4719052124023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,1,1,power_law_1.01,0.5477990341186524
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,1,1,power_law_1.2,0.03726144075393677
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,1,1,power_law_1.2,1.920791015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,1,1,power_law_1.01,0.9186431884765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,1,1,power_law_1.01,1.006131820678711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,1,1,power_law_1.2,2.3591276550292966
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,1,1,power_law_1.01,1.0371084594726563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,1,1,power_law_1.01,1.0757901000976564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,1,1,power_law_1.01,1.0899353790283204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,1,1,power_law_1.01,1.1601203155517577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,1,1,power_law_1.01,1.7051744079589846
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,1,1,power_law_1.01,1.720740509033203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,1,1,power_law_1.01,1.7944717407226562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,1,1,power_law_1.01,0.10037247657775879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,1,1,power_law_1.01,1.8631814575195313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,1,1,power_law_1.01,1.8822476196289064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,1,1,power_law_1.01,1.9815026855468751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,1,1,power_law_1.01,2.1320326232910154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,1,1,power_law_1.01,2.2999641418457033
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,1,1,power_law_1.01,2.7357708740234377
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,1,1,power_law_1.01,3.259367065429687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,1,1,power_law_1.01,4.297936706542968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,1,1,power_law_1.01,0.09220031738281251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,1,1,power_law_1.01,5.362412109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,1,1,power_law_1.01,0.14952704429626465
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,1,1,power_law_1.01,0.21970176696777344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,1,1,power_law_1.01,0.29137855529785156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,1,1,power_law_1.01,0.4719827270507812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,1,1,power_law_1.01,0.06860415935516358
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,1,1,power_law_1.01,7.558972778320313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,1,1,power_law_1.01,0.5239251327514649
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,1,1,power_law_1.01,0.5423590469360351
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,1,1,power_law_1.01,0.5556121444702148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,1,1,power_law_1.01,0.5636428833007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,1,1,power_law_1.01,0.5778355026245118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,1,1,power_law_1.01,0.6410316467285156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,1,1,power_law_1.01,0.6461074829101563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,1,1,power_law_1.01,0.6747347259521485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,1,1,power_law_1.01,0.6785990142822266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,1,1,power_law_1.01,9.965159912109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,1,1,power_law_1.01,0.6838784027099609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,1,1,power_law_1.01,0.7036608123779298
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,1,1,power_law_1.01,0.7693427276611329
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.01,0.8008025360107421
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.01,0.9504531097412109
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.01,1.1654259490966798
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.01,1.4597305297851562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.01,1.84388671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.01,2.4824281311035157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,1,1,power_law_1.01,14.369240722656249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,1,1,power_law_1.2,0.10648768424987794
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.01,3.16857666015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,1,1,power_law_1.2,0.1132192039489746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,1,1,power_law_1.2,0.241213436126709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,1,1,power_law_1.2,0.3611743927001953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,1,1,power_law_1.2,0.49378494262695316
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.01,4.501693420410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,1,1,power_law_1.2,0.9415711975097656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,1,1,power_law_1.2,1.0237913513183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,1,1,power_law_1.2,1.0592697906494142
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.01,5.742472534179687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,1,1,power_law_1.2,1.1031302642822265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,1,1,power_law_1.2,1.1095014190673829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,1,1,power_law_1.2,1.1674604797363282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,1,1,power_law_1.01,18.683707275390624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,1,1,power_law_1.2,1.7334010314941406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,1,1,power_law_1.2,1.7458201599121093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.01,7.210176391601562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,1,1,power_law_1.2,1.8338616943359376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,1,1,power_law_1.2,1.8944281005859374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,1,1,power_law_1.2,1.9163999938964842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,1,1,power_law_1.2,2.0150912475585936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,1,1,power_law_1.2,2.1787033081054688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,1,1,power_law_1.2,2.3338688659667968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,1,1,power_law_1.2,2.8736224365234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,1,1,power_law_1.01,23.03049072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,1,1,power_law_1.2,3.3165402221679683
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,1,1,power_law_1.2,0.07306623935699463
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,1,1,power_law_1.2,4.354974060058593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,1,1,power_law_1.2,0.07978879928588867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,1,1,power_law_1.2,0.1361894416809082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,1,1,power_law_1.2,0.19806655883789062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,1,1,power_law_1.2,5.433156127929688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,1,1,power_law_1.2,0.26577407836914063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,1,1,power_law_1.2,0.4876383972167969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,1,1,power_law_1.2,0.5334995269775391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,1,1,power_law_1.2,0.5501708984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,1,1,power_law_1.2,0.5659699249267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,1,1,power_law_1.2,0.5683232116699218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,1,1,power_law_1.2,0.5818636703491211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,1,1,power_law_1.2,7.734810791015624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,1,1,power_law_1.2,0.6542131042480468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,1,1,power_law_1.2,0.6575615692138672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,1,1,power_law_1.2,0.6774105834960937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,1,1,power_law_1.2,0.7092652893066406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,1,1,power_law_1.2,0.6981394958496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,1,1,power_law_1.2,0.7215411376953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,1,1,power_law_1.2,0.7830931091308594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,1,1,power_law_1.2,0.8655718231201173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,1,1,power_law_1.2,10.029349365234376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,1,1,power_law_1.2,1.0105228424072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,1,1,power_law_1.2,1.1762809753417969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,1,1,power_law_1.2,1.4946823120117188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,1,1,power_law_1.2,1.836815948486328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,1,1,power_law_1.2,2.500540771484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,1,1,power_law_1.2,3.182996520996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,1,1,power_law_1.2,14.3170263671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,1,1,power_law_1.01,0.3746451187133789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,1,1,power_law_1.01,0.2206208038330078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,1,1,power_law_1.2,4.495488586425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,1,1,power_law_1.01,1.0299910736083984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,1,1,power_law_1.01,1.477550048828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,1,1,power_law_1.2,5.787454833984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,1,1,power_law_1.01,0.5645369720458985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,1,1,power_law_1.01,2.5553747558593747
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,1,1,power_law_1.2,18.800657958984374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,1,1,power_law_1.01,2.8008511352539065
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,1,1,power_law_1.2,7.272529907226563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,1,1,power_law_1.01,2.967523193359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,1,1,power_law_1.01,3.1278546142578127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,1,1,power_law_1.01,3.208587646484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,1,1,power_law_1.01,3.4158584594726564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,1,1,power_law_1.01,3.6980941772460936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,1,1,power_law_1.2,23.3718017578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,1,1,power_law_1.01,5.326831665039062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,1,1,power_law_1.01,5.451190795898437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,1,1,power_law_1.01,5.696498413085938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,1,1,power_law_1.01,5.826233520507812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,1,1,power_law_1.01,6.141153564453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,1,1,power_law_1.01,6.754859008789063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,1,1,power_law_1.01,7.1223559570312505
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,1,1,power_law_1.01,7.9837060546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,1,1,power_law_1.01,9.519234619140624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,1,1,power_law_1.01,0.14424448013305663
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,1,1,power_law_1.01,0.20797183990478513
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,1,1,power_law_1.01,11.977291259765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,1,1,power_law_1.01,0.3096326446533203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,1,1,power_law_1.01,0.5629862213134766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,1,1,power_law_1.01,0.80408447265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,1,1,power_law_1.01,14.578563232421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,1,1,power_law_1.01,1.3779866027832033
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,1,1,power_law_1.01,1.4994598388671876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,1,1,power_law_1.01,1.5808493041992189
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,1,1,power_law_1.01,1.6384442138671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,1,1,power_law_1.01,1.6723577880859373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,1,1,power_law_1.01,1.711946258544922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,1,1,power_law_1.01,1.7530931091308595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,1,1,power_law_1.01,1.8907058715820313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,1,1,power_law_1.01,20.113619384765624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,1,1,power_law_1.01,1.9037081909179687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,1,1,power_law_1.01,1.9671589660644533
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,1,1,power_law_1.01,1.9717779541015623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,1,1,power_law_1.01,2.0517984008789063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,1,1,power_law_1.01,2.188426208496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.01,2.322746887207031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,1,1,power_law_1.01,25.343012695312503
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.01,2.537806091308594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.01,3.0032473754882814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.01,3.6750106811523438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.01,4.435633850097656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.01,5.929212646484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.01,7.5261383056640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,1,1,power_law_1.2,0.28825855255126953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,1,1,power_law_1.2,0.2261190414428711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,1,1,power_law_1.2,0.5389702224731445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,1,1,power_law_1.2,0.897558364868164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,1,1,power_law_1.01,36.523525390625004
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,1,1,power_law_1.2,1.275541763305664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.01,11.054642333984376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,1,1,power_law_1.2,2.539271697998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,1,1,power_law_1.2,2.821405944824219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,1,1,power_law_1.2,3.033870849609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,1,1,power_law_1.2,3.204744262695313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.01,14.1219384765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,1,1,power_law_1.2,3.338446044921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,1,1,power_law_1.2,3.552162475585938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,1,1,power_law_1.2,3.8086508178710936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.01,16.97937744140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,1,1,power_law_1.2,5.575120239257812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,1,1,power_law_1.2,5.689950561523437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,1,1,power_law_1.01,48.155693359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,1,1,power_law_1.2,5.9679443359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,1,1,power_law_1.2,6.123601684570312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,1,1,power_law_1.2,6.344364624023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,1,1,power_law_1.2,6.795221557617188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,1,1,power_law_1.2,7.161090087890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,1,1,power_law_1.2,8.375265502929688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,1,1,power_law_1.2,9.474923095703124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,1,1,power_law_1.01,59.6334375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,1,1,power_law_1.2,12.369254150390626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,1,1,power_law_1.2,0.1615884780883789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,1,1,power_law_1.2,0.30056320190429686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,1,1,power_law_1.2,14.904766845703126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,1,1,power_law_1.2,0.49745151519775394
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,1,1,power_law_1.2,0.6968281555175782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,1,1,power_law_1.2,1.3606335449218752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,1,1,power_law_1.2,1.5066911315917968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,1,1,power_law_1.2,1.6150579833984373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,1,1,power_law_1.2,20.279058837890624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,1,1,power_law_1.2,1.6639520263671876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,1,1,power_law_1.2,0.14347968101501465
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,1,1,power_law_1.2,1.666735382080078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,1,1,power_law_1.2,1.755018310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,1,1,power_law_1.2,1.7843154907226562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,1,1,power_law_1.2,1.940782012939453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,1,1,power_law_1.2,1.979584655761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,1,1,power_law_1.2,2.0313075256347655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,1,1,power_law_1.2,2.0569638061523436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,1,1,power_law_1.2,2.137518005371094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,1,1,power_law_1.2,2.2347514343261716
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,1,1,power_law_1.2,25.96329345703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,1,1,power_law_1.2,2.3579507446289063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,1,1,power_law_1.2,2.6975021362304688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,1,1,power_law_1.2,3.0511294555664064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,1,1,power_law_1.2,3.777277526855469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,1,1,power_law_1.2,4.536312255859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,1,1,power_law_1.2,5.996670532226562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,1,1,power_law_1.2,7.475218505859376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,1,1,power_law_1.01,0.2518623924255371
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,1,1,power_law_1.01,0.4720185470581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,1,1,power_law_1.2,38.06991455078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,1,1,power_law_1.01,0.7254086303710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,1,1,power_law_1.2,11.175924072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,1,1,power_law_1.01,0.9095859527587891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,1,1,power_law_1.01,2.081092529296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,1,1,power_law_1.01,2.9590853881835937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,1,1,power_law_1.2,14.0160986328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,1,1,power_law_1.01,3.5271044921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,1,1,power_law_1.01,4.695076599121093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,1,1,power_law_1.2,17.00081298828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,1,1,power_law_1.01,5.0297131347656245
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,1,1,power_law_1.01,5.22618896484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,1,1,power_law_1.01,5.470170288085937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,1,1,power_law_1.01,5.6628961181640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,1,1,power_law_1.2,50.6875634765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,1,1,power_law_1.01,5.939630737304688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,1,1,power_law_1.01,6.379244995117188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,1,1,power_law_1.01,6.910768432617187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,1,1,power_law_1.01,7.281939086914062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,1,1,power_law_1.01,10.37630615234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,1,1,power_law_1.01,11.211689453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,1,1,power_law_1.01,11.99723388671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,1,1,power_law_1.2,63.31108886718751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,1,1,power_law_1.01,13.268598632812502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,1,1,power_law_1.01,14.401622314453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,1,1,power_law_1.01,0.16059648513793945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,1,1,power_law_1.01,16.414567871093748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,1,1,power_law_1.01,0.24623424530029298
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,1,1,power_law_1.01,0.41386497497558594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,1,1,power_law_1.01,0.5033375930786133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,1,1,power_law_1.01,18.367788085937498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,1,1,power_law_1.01,1.0873363494873047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,1,1,power_law_1.01,1.5984384155273437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,1,1,power_law_1.01,1.8860870361328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,1,1,power_law_1.01,2.507176971435547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,1,1,power_law_1.01,2.6683578491210938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,1,1,power_law_1.01,2.775420837402344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,1,1,power_law_1.01,22.89610595703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,1,1,power_law_1.01,2.892445373535156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,1,1,power_law_1.01,2.9723794555664065
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,1,1,power_law_1.01,3.0529266357421876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,1,1,power_law_1.01,3.1539239501953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,1,1,power_law_1.01,28.29615478515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,1,1,power_law_1.01,3.2355526733398436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,1,1,power_law_1.01,3.2960101318359376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,1,1,power_law_1.01,3.7041567993164066
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,1,1,power_law_1.01,3.8424475097656248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.01,4.00931396484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.01,4.322364807128906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.01,4.574593200683593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.01,5.265708618164062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.01,5.88892822265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,1,1,power_law_1.01,38.67859130859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.01,7.268355102539063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,1,1,power_law_1.2,0.47220798492431637
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.01,9.166373291015626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,1,1,power_law_1.2,0.5697119903564454
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,1,1,power_law_1.2,0.2413747215270996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,1,1,power_law_1.2,0.9752301025390626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,1,1,power_law_1.2,1.7127635192871093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.01,12.189884033203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,1,1,power_law_1.2,2.6285345458984373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,1,1,power_law_1.01,49.1872998046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,1,1,power_law_1.2,3.1291595458984376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.01,15.183162841796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,1,1,power_law_1.2,4.461912841796876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,1,1,power_law_1.2,4.744423828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,1,1,power_law_1.2,5.017201843261718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,1,1,power_law_1.2,5.355864868164063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.01,17.7076953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,1,1,power_law_1.2,5.645017700195313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,1,1,power_law_1.01,58.951137695312504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,1,1,power_law_1.2,5.869688720703126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,1,1,power_law_1.2,6.414902954101562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,1,1,power_law_1.2,6.925260009765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,1,1,power_law_1.2,7.506859130859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,1,1,power_law_1.2,10.5024609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,1,1,power_law_1.2,11.441927490234374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,1,1,power_law_1.2,12.321142578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,1,1,power_law_1.2,13.590554199218749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,1,1,power_law_1.2,15.087205810546873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,1,1,power_law_1.2,0.1607948875427246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,1,1,power_law_1.2,17.28933837890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,1,1,power_law_1.2,0.2461305618286133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,1,1,power_law_1.2,0.3258182525634766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,1,1,power_law_1.2,0.5108607864379883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,1,1,power_law_1.2,19.653699951171877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,1,1,power_law_1.2,0.9349388885498048
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,1,1,power_law_1.2,1.415594940185547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,1,1,power_law_1.2,1.6751756286621096
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,1,1,power_law_1.2,2.376719970703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,1,1,power_law_1.2,24.6552001953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,1,1,power_law_1.2,2.526042175292969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,1,1,power_law_1.2,2.651341552734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,1,1,power_law_1.2,2.8115640258789063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,1,1,power_law_1.2,2.90762939453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,1,1,power_law_1.2,2.976538391113281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,1,1,power_law_1.2,3.1036218261718753
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,1,1,power_law_1.2,3.190882568359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,1,1,power_law_1.2,29.922512207031254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,1,1,power_law_1.2,3.2930029296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,1,1,power_law_1.2,3.707824096679688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,1,1,power_law_1.2,3.935733642578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,1,1,power_law_1.2,4.16445068359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,1,1,power_law_1.2,4.5482635498046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,1,1,power_law_1.2,4.849620971679688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,1,1,power_law_1.2,5.594185180664063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,1,1,power_law_1.2,6.288095703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,1,1,power_law_1.2,39.42294189453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,1,1,power_law_1.2,7.742226562499999
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,2,1,power_law_1.01,0.11430848121643067
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,1,1,power_law_1.2,9.877214965820311
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,2,1,power_law_1.01,0.2129759979248047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,1,1,power_law_1.2,12.838808593749999
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,2,1,power_law_1.01,0.18255231857299806
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,2,1,power_law_1.01,0.36611774444580075
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,1,1,power_law_1.2,50.5093505859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,1,1,power_law_1.2,15.55731689453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,2,1,power_law_1.01,0.3489606475830078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,2,1,power_law_1.01,0.38949119567871093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,2,1,power_law_1.01,0.4225056076049805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,2,1,power_law_1.01,0.3899302291870117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,2,1,power_law_1.01,0.4542489624023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,2,1,power_law_1.01,0.4835744094848633
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,2,1,power_law_1.01,0.5060710525512695
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,2,1,power_law_1.01,0.5052972793579101
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,2,1,power_law_1.01,0.4123660659790039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,2,1,power_law_1.01,0.44577152252197266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,1,1,power_law_1.2,17.99011474609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,2,1,power_law_1.01,0.3575462341308594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,2,1,power_law_1.01,1.0946195220947266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,2,1,power_law_1.01,1.4399378967285155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,2,1,power_law_1.01,0.525912971496582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,2,1,power_law_1.01,0.543262710571289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,2,1,power_law_1.01,0.7235609436035156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,1,1,power_law_1.2,60.5048095703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,2,1,power_law_1.01,0.8516998291015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,2,1,power_law_1.01,2.116204833984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,2,1,power_law_1.01,2.704210510253906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,2,1,power_law_1.01,3.85716552734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,2,1,power_law_1.01,0.0734611177444458
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,2,1,power_law_1.01,0.12423680305480958
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,2,1,power_law_1.01,5.030768127441407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,2,1,power_law_1.01,0.1962937545776367
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,2,1,power_law_1.01,0.19751039505004883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,2,1,power_law_1.01,0.10558015823364257
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,2,1,power_law_1.01,7.532588500976563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,2,1,power_law_1.01,0.2000992012023926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,2,1,power_law_1.01,0.20230144500732422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,2,1,power_law_1.01,10.286809082031251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,2,1,power_law_1.01,0.19992319107055664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,2,1,power_law_1.01,12.663380126953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,2,1,power_law_1.01,0.20086528778076174
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,2,1,power_law_1.01,0.21061952590942382
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,2,1,power_law_1.01,0.39268672943115235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.01,0.4421715164184571
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,2,1,power_law_1.01,0.22853887557983396
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,2,1,power_law_1.01,0.22739391326904296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,2,1,power_law_1.01,0.23731456756591798
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,2,1,power_law_1.01,0.2523859214782715
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.01,1.1814508819580078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.01,1.4788876342773438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,2,1,power_law_1.01,0.2726016044616699
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.01,2.178503723144531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,2,1,power_law_1.01,0.28378944396972655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.01,2.8756506347656248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.01,4.183356018066407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,2,1,power_law_1.01,0.29616832733154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,2,1,power_law_1.2,0.34327552795410154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.01,5.4814404296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,2,1,power_law_1.2,0.10844351768493651
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.01,0.6077824020385743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.01,0.800738525390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.01,7.294268798828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,2,1,power_law_1.2,0.44873790740966796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,2,1,power_law_1.2,0.19093120574951172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,2,1,power_law_1.2,0.3825593566894531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,2,1,power_law_1.2,0.4794099044799805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,2,1,power_law_1.2,0.4930380630493164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,2,1,power_law_1.2,0.1554758358001709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,2,1,power_law_1.2,0.515344009399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,2,1,power_law_1.2,0.5447993469238281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,2,1,power_law_1.2,0.3333395385742187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,2,1,power_law_1.2,0.5481708908081055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,2,1,power_law_1.2,0.3971551895141602
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,2,1,power_law_1.2,0.7215724945068359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,2,1,power_law_1.2,0.8600038146972656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,2,1,power_law_1.2,0.35673728942871097
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,2,1,power_law_1.2,1.1823897552490235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,2,1,power_law_1.2,0.4115449523925781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,2,1,power_law_1.2,1.4114988708496095
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,2,1,power_law_1.2,0.4252441787719727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,2,1,power_law_1.2,0.4370636749267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,2,1,power_law_1.2,3.8703231811523438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,2,1,power_law_1.2,5.095848388671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,2,1,power_law_1.2,0.07372032165527344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,2,1,power_law_1.2,2.150609893798828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,2,1,power_law_1.2,2.669613952636719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,2,1,power_law_1.2,10.294779052734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,2,1,power_law_1.2,0.11400896072387696
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,2,1,power_law_1.2,12.86595703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,2,1,power_law_1.2,0.207696647644043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,2,1,power_law_1.2,0.19009408950805665
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,2,1,power_law_1.2,0.21486528396606444
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,2,1,power_law_1.2,0.22864448547363284
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,2,1,power_law_1.2,0.09889599800109863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,2,1,power_law_1.2,0.2339206314086914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,2,1,power_law_1.2,0.23409343719482423
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,2,1,power_law_1.2,0.2501318359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,2,1,power_law_1.2,0.27014976501464844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,2,1,power_law_1.2,0.1969696044921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,2,1,power_law_1.2,7.446795043945312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,2,1,power_law_1.2,0.38212032318115235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,2,1,power_law_1.2,0.1998387145996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,2,1,power_law_1.2,0.4454681777954102
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,2,1,power_law_1.2,0.6043571090698242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,2,1,power_law_1.2,0.8174553680419923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,2,1,power_law_1.2,0.2027225685119629
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,2,1,power_law_1.2,1.1595903778076173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,2,1,power_law_1.2,0.19917695999145507
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,2,1,power_law_1.2,1.4581817626953124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,2,1,power_law_1.01,0.18963327407836914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,2,1,power_law_1.01,0.29923391342163086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,2,1,power_law_1.2,2.3309945678710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,2,1,power_law_1.01,0.3769196701049805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,2,1,power_law_1.2,2.8612933349609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,2,1,power_law_1.01,0.9083052825927733
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,2,1,power_law_1.2,0.28991487503051755
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,2,1,power_law_1.01,0.9205606079101563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,2,1,power_law_1.2,4.1610546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,2,1,power_law_1.01,0.6053337478637696
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,2,1,power_law_1.01,0.9509855651855469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,2,1,power_law_1.01,0.939151382446289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,2,1,power_law_1.01,0.9594950103759766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,2,1,power_law_1.01,1.0173465728759765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,2,1,power_law_1.01,1.064204788208008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,2,1,power_law_1.01,1.0686278533935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,2,1,power_law_1.2,5.584254150390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,2,1,power_law_1.01,1.1941798400878905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,2,1,power_law_1.01,1.2423296356201172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,2,1,power_law_1.01,1.2706047821044923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,2,1,power_law_1.2,0.2956780815124512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,2,1,power_law_1.01,1.3402310180664063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,2,1,power_law_1.2,6.931000366210938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,2,1,power_law_1.01,1.662434539794922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,2,1,power_law_1.01,2.1281805419921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,2,1,power_law_1.01,2.628394775390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,2,1,power_law_1.01,3.700445556640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,2,1,power_law_1.01,4.815214843750001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,2,1,power_law_1.01,7.01934814453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,2,1,power_law_1.01,9.569354858398437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,2,1,power_law_1.01,0.1016108798980713
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,2,1,power_law_1.01,0.15948543548583985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,2,1,power_law_1.01,13.85715087890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,2,1,power_law_1.01,0.31903743743896484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,2,1,power_law_1.01,0.19178943634033202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,2,1,power_law_1.01,0.30976768493652346
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,2,1,power_law_1.01,0.3117395210266113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,2,1,power_law_1.01,18.369698486328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,2,1,power_law_1.01,0.3272940826416016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,2,1,power_law_1.01,0.31622783660888676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,2,1,power_law_1.01,0.3131923294067383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,2,1,power_law_1.01,0.3650239944458008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,2,1,power_law_1.01,0.3149363136291504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,2,1,power_law_1.01,0.35466880798339845
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,2,1,power_law_1.01,0.35489086151123045
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,2,1,power_law_1.01,0.46173183441162113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,2,1,power_law_1.01,0.602023048400879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.01,0.761886749267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.01,1.3305062866210937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,2,1,power_law_1.01,28.85110595703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.01,1.9094047546386719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,2,1,power_law_1.01,0.3942041778564453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,2,1,power_law_1.01,0.4040057754516601
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.01,2.454510040283203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,2,1,power_law_1.01,0.44456703186035157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.01,3.612074279785156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.01,4.614575500488281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,2,1,power_law_1.2,0.25219135284423827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,2,1,power_law_1.2,0.1851193618774414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.01,1.0342630767822265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,2,1,power_law_1.2,0.36728511810302733
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,2,1,power_law_1.2,0.8622022247314453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,2,1,power_law_1.2,0.9151974487304688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.01,6.820569458007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,2,1,power_law_1.2,0.6035987091064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,2,1,power_law_1.2,0.950219497680664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,2,1,power_law_1.2,0.9388537597656249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,2,1,power_law_1.2,0.9952114868164064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,2,1,power_law_1.2,1.0320159912109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,2,1,power_law_1.2,1.0707756805419923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,2,1,power_law_1.2,1.076248321533203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,2,1,power_law_1.2,1.1098873901367188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,2,1,power_law_1.2,1.2475167846679687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,2,1,power_law_1.2,1.287386932373047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,2,1,power_law_1.2,1.338671417236328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,2,1,power_law_1.01,39.866184082031246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,2,1,power_law_1.2,1.6334585571289062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.01,9.339403686523436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,2,1,power_law_1.2,2.1442828369140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,2,1,power_law_1.2,2.6525299072265627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,2,1,power_law_1.2,3.69711181640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.01,11.795911865234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,2,1,power_law_1.2,4.84903564453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,2,1,power_law_1.2,7.259151000976563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,2,1,power_law_1.2,9.301220092773438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,2,1,power_law_1.01,50.4749169921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,2,1,power_law_1.2,13.650738525390626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,2,1,power_law_1.2,0.14344063758850098
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,2,1,power_law_1.2,0.10151616096496582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,2,1,power_law_1.2,0.31520896911621094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,2,1,power_law_1.2,0.17935167312622072
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,2,1,power_law_1.2,0.31624832153320315
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,2,1,power_law_1.2,0.3079763221740722
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,2,1,power_law_1.2,18.544864501953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,2,1,power_law_1.2,0.3596460723876953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,2,1,power_law_1.2,0.3030054473876953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,2,1,power_law_1.2,0.3660652923583984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,2,1,power_law_1.2,0.3210707092285156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,2,1,power_law_1.2,0.32091712951660156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,2,1,power_law_1.2,0.46722496032714844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,2,1,power_law_1.2,0.475175666809082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,2,1,power_law_1.2,0.6174272155761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,2,1,power_law_1.2,0.7587987518310546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,2,1,power_law_1.2,0.3325414276123047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,2,1,power_law_1.2,0.3603257751464844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,2,1,power_law_1.2,1.2694271850585939
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,2,1,power_law_1.2,1.9157913208007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,2,1,power_law_1.2,2.4161721801757814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,2,1,power_law_1.2,0.39290241241455076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,2,1,power_law_1.2,0.41151168823242185
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,2,1,power_law_1.2,29.35537109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,2,1,power_law_1.2,3.5250253295898437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,2,1,power_law_1.2,4.7293310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,2,1,power_law_1.2,1.0411730957031249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,2,1,power_law_1.01,0.14720383644104004
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,2,1,power_law_1.01,0.23109439849853514
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,2,1,power_law_1.01,0.27444351196289063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,2,1,power_law_1.01,0.5523481750488282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,2,1,power_law_1.01,0.9089568328857421
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,2,1,power_law_1.2,6.802774047851562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,2,1,power_law_1.01,1.2340748596191407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,2,1,power_law_1.01,1.7859225463867188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,2,1,power_law_1.01,1.8737689208984374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,2,1,power_law_1.01,1.9503961181640626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,2,1,power_law_1.01,1.9938674926757813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,2,1,power_law_1.01,2.110113220214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,2,1,power_law_1.01,2.2163655090332033
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,2,1,power_law_1.2,40.5920166015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,2,1,power_law_1.01,2.2913600158691407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,2,1,power_law_1.2,11.3849072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,2,1,power_law_1.01,2.481320343017578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,2,1,power_law_1.01,3.538785400390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,2,1,power_law_1.01,3.6347558593750002
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,2,1,power_law_1.01,3.8300952148437504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,2,1,power_law_1.01,4.158668823242188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,2,1,power_law_1.01,4.413050842285156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,2,1,power_law_1.2,9.104255981445313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,2,1,power_law_1.01,4.997552490234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,2,1,power_law_1.01,5.520528564453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,2,1,power_law_1.2,51.084858398437504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,2,1,power_law_1.01,6.535059204101563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,2,1,power_law_1.01,0.09577664375305175
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,2,1,power_law_1.01,0.13837183952331542
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,2,1,power_law_1.01,7.68761962890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,2,1,power_law_1.01,0.17287551879882812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,2,1,power_law_1.01,0.31205184936523434
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,2,1,power_law_1.01,0.4987891387939453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,2,1,power_law_1.01,0.6750118255615234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,2,1,power_law_1.01,0.9672870635986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,2,1,power_law_1.01,10.66251953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,2,1,power_law_1.01,1.0057516479492188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,2,1,power_law_1.01,1.0448230743408202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,2,1,power_law_1.01,1.0713209533691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,2,1,power_law_1.01,1.118158721923828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,2,1,power_law_1.01,1.1394911956787108
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,2,1,power_law_1.01,1.1705017852783204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,2,1,power_law_1.01,13.23791015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,2,1,power_law_1.01,1.205966110229492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,2,1,power_law_1.01,1.3527673339843749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,2,1,power_law_1.01,1.3838316345214845
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,2,1,power_law_1.01,1.4254534912109373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,2,1,power_law_1.01,1.4950381469726561
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.01,1.5963456726074219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.01,1.7203091430664064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.01,1.9382879638671873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,2,1,power_law_1.01,18.04280517578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.01,2.3081324768066405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.01,2.7116293334960937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,2,1,power_law_1.2,0.14885951995849608
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.01,3.5348718261718752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,2,1,power_law_1.2,0.21496000289916992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,2,1,power_law_1.2,0.2399488067626953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.01,4.308851318359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,2,1,power_law_1.2,0.49809024810791014
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,2,1,power_law_1.2,0.7774079895019531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.01,5.902213745117187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,2,1,power_law_1.2,1.089678726196289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,2,1,power_law_1.01,23.465708007812502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,2,1,power_law_1.2,1.7296832275390623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,2,1,power_law_1.2,1.850110778808594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.01,7.435865478515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,2,1,power_law_1.2,1.9173472595214842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,2,1,power_law_1.2,1.9800997924804686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,2,1,power_law_1.2,2.113870086669922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,2,1,power_law_1.2,2.237391357421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.01,9.596250610351563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,2,1,power_law_1.2,2.3553318786621094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,2,1,power_law_1.2,2.570113220214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,2,1,power_law_1.2,3.641892395019531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,2,1,power_law_1.2,3.7694207763671876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,2,1,power_law_1.01,28.93051025390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,2,1,power_law_1.2,3.968226013183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,2,1,power_law_1.2,4.359914245605468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,2,1,power_law_1.2,4.66110595703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,2,1,power_law_1.2,5.267509765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,2,1,power_law_1.2,5.617833251953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,2,1,power_law_1.2,0.09436991691589355
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,2,1,power_law_1.2,6.8043310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,2,1,power_law_1.2,0.1348697566986084
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,2,1,power_law_1.2,0.16370559692382813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,2,1,power_law_1.2,0.2886323165893555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,2,1,power_law_1.2,8.080956420898437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,2,1,power_law_1.2,0.4411238479614258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,2,1,power_law_1.2,0.6011225509643554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,2,1,power_law_1.2,0.9356832122802734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,2,1,power_law_1.2,0.9893363189697265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,2,1,power_law_1.2,1.0165792083740235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,2,1,power_law_1.2,10.893275146484374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,2,1,power_law_1.2,1.0545536041259767
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,2,1,power_law_1.2,1.0942073822021485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,2,1,power_law_1.2,1.138128662109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,2,1,power_law_1.2,1.1687744140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,2,1,power_law_1.2,13.564864501953124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,2,1,power_law_1.2,1.2235826873779296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,2,1,power_law_1.2,1.3822451782226561
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,2,1,power_law_1.2,1.4396762084960937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,2,1,power_law_1.2,1.4815155029296876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,2,1,power_law_1.2,1.5766355895996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,2,1,power_law_1.2,1.679242858886719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,2,1,power_law_1.2,1.8911744689941408
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,2,1,power_law_1.2,2.0489683532714844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,2,1,power_law_1.2,18.476884765624998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,2,1,power_law_1.2,2.4188908386230468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,2,1,power_law_1.2,2.8377401733398435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,2,1,power_law_1.2,3.6236474609375002
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,2,1,power_law_1.2,4.487686462402344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,2,1,power_law_1.01,0.03568703889846801
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,2,1,power_law_1.01,0.03944063901901245
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,2,1,power_law_1.2,6.047684326171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,2,1,power_law_1.2,23.69466796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,2,1,power_law_1.01,0.14701120376586913
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,2,1,power_law_1.01,0.05729152202606201
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,2,1,power_law_1.2,7.694515380859374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,2,1,power_law_1.01,0.0751743984222412
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,2,1,power_law_1.01,0.1787628746032715
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,2,1,power_law_1.01,0.18640192031860353
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,2,1,power_law_1.2,9.596386108398438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,2,1,power_law_1.01,0.19029823303222657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,2,1,power_law_1.01,0.09506496429443359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,2,1,power_law_1.01,0.16450496673583986
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,2,1,power_law_1.2,29.167363281249997
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,2,1,power_law_1.01,0.1665011215209961
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,2,1,power_law_1.01,0.20981632232666017
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,2,1,power_law_1.01,0.17127296447753906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,2,1,power_law_1.01,0.25708288192749024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,2,1,power_law_1.01,0.30647104263305663
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,2,1,power_law_1.01,0.1736934471130371
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,2,1,power_law_1.01,0.3557228851318359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,2,1,power_law_1.01,0.44471809387207034
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,2,1,power_law_1.01,0.9310598754882813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,2,1,power_law_1.01,0.19958208084106446
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,2,1,power_law_1.01,0.19571712493896484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,2,1,power_law_1.01,1.3413433837890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,2,1,power_law_1.01,0.21478399276733398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,2,1,power_law_1.01,0.036514561176300045
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,2,1,power_law_1.01,0.046520318984985355
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,2,1,power_law_1.01,0.059091839790344235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,2,1,power_law_1.01,0.07311039924621582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,2,1,power_law_1.01,0.22741247177124024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,2,1,power_law_1.01,0.10159999847412109
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,2,1,power_law_1.01,0.10908543586730957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,2,1,power_law_1.01,1.747271728515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,2,1,power_law_1.01,0.5370521545410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,2,1,power_law_1.01,0.11249600410461427
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,2,1,power_law_1.01,0.11433152198791503
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,2,1,power_law_1.01,0.1148192024230957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,2,1,power_law_1.01,0.11864000320434571
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,2,1,power_law_1.01,0.13788479804992676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,2,1,power_law_1.01,2.1083833312988283
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,2,1,power_law_1.01,0.13898880004882813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,2,1,power_law_1.01,0.14441984176635742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,2,1,power_law_1.01,0.14755711555480958
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,2,1,power_law_1.01,0.1510521602630615
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,2,1,power_law_1.01,0.1617100715637207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,2,1,power_law_1.01,0.17446527481079102
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,2,1,power_law_1.01,0.1867788887023926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,2,1,power_law_1.01,0.22336063385009766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,2,1,power_law_1.01,0.2620998382568359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,2,1,power_law_1.01,0.3330918502807617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,2,1,power_law_1.01,0.4038419342041015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,2,1,power_law_1.01,0.5515999984741211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,2,1,power_law_1.01,0.7010489654541016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,2,1,power_law_1.01,1.005132827758789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,2,1,power_law_1.01,0.03056256055831909
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,2,1,power_law_1.01,1.301846466064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,2,1,power_law_1.2,0.06963840007781982
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,2,1,power_law_1.01,0.7326541137695313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,2,1,power_law_1.01,1.6048352050781252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,2,1,power_law_1.2,0.1757619285583496
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,2,1,power_law_1.2,0.03703167915344238
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,2,1,power_law_1.2,0.051179518699646
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,2,1,power_law_1.2,0.035656960010528566
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,2,1,power_law_1.2,0.1940447998046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,2,1,power_law_1.2,0.14284223556518555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,2,1,power_law_1.2,0.08997056007385254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,2,1,power_law_1.2,0.19989887237548828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,2,1,power_law_1.2,0.15951616287231446
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,2,1,power_law_1.2,0.2185932731628418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,2,1,power_law_1.2,0.16858495712280272
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,2,1,power_law_1.2,0.22495359420776367
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,2,1,power_law_1.2,0.260505599975586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,2,1,power_law_1.2,0.17156095504760743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,2,1,power_law_1.2,0.31071487426757816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,2,1,power_law_1.2,0.36586814880371094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,2,1,power_law_1.2,0.44780929565429684
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,2,1,power_law_1.2,0.1821196746826172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,2,1,power_law_1.2,0.1890707206726074
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,2,1,power_law_1.2,0.5501343917846679
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,2,1,power_law_1.2,0.7403545379638672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,2,1,power_law_1.2,0.9440415954589844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,2,1,power_law_1.2,0.1931814384460449
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,2,1,power_law_1.2,0.036204800605773926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,2,1,power_law_1.2,0.04547264099121094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,2,1,power_law_1.2,0.055175681114196774
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,2,1,power_law_1.2,0.07067840099334717
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,2,1,power_law_1.2,0.10356479644775392
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,2,1,power_law_1.2,1.7311827087402343
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,2,1,power_law_1.2,0.11078911781311036
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,2,1,power_law_1.2,0.2106233596801758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,2,1,power_law_1.2,0.11276927947998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,2,1,power_law_1.2,0.11680959701538085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,2,1,power_law_1.2,2.152659912109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,2,1,power_law_1.2,0.1163488006591797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,2,1,power_law_1.2,0.11925696372985839
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,2,1,power_law_1.2,0.13990528106689454
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,2,1,power_law_1.2,0.14140800476074217
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,2,1,power_law_1.2,0.14681407928466797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,2,1,power_law_1.2,0.15143744468688963
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,2,1,power_law_1.2,0.15608575820922851
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,2,1,power_law_1.2,0.16717567443847656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,2,1,power_law_1.2,0.1762873649597168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,2,1,power_law_1.2,0.19108352661132813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,2,1,power_law_1.2,0.22829248428344728
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,2,1,power_law_1.2,0.26529024124145506
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,2,1,power_law_1.2,0.33530689239501954
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,2,1,power_law_1.2,0.4105753707885742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,2,1,power_law_1.2,0.5581785583496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,2,1,power_law_1.2,1.334197692871094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,2,1,power_law_1.01,0.06248447895050049
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,2,1,power_law_1.2,0.7130258941650391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,2,1,power_law_1.01,0.07617216110229492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,2,1,power_law_1.01,0.13492159843444823
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,2,1,power_law_1.2,1.0115647888183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,2,1,power_law_1.01,0.2858598327636719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,2,1,power_law_1.2,1.3139570617675782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,2,1,power_law_1.2,0.030668160915374755
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,2,1,power_law_1.01,0.5104147338867188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,2,1,power_law_1.2,1.6131814575195313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,2,1,power_law_1.01,0.5521587371826172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,2,1,power_law_1.01,0.5474111938476562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,2,1,power_law_1.01,0.582905616760254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,2,1,power_law_1.01,0.6080319976806641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,2,1,power_law_1.01,0.6450463867187499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,2,1,power_law_1.01,0.708361587524414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,2,1,power_law_1.01,0.6553369903564453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,2,1,power_law_1.01,0.21045888900756834
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,2,1,power_law_1.01,0.7207718658447265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,2,1,power_law_1.01,0.4730809783935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,2,1,power_law_1.01,0.7981881713867187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,2,1,power_law_1.01,0.9226105499267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,2,1,power_law_1.01,1.0873299407958985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,2,1,power_law_1.01,0.5324192047119141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,2,1,power_law_1.01,1.3937370300292968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,2,1,power_law_1.01,1.633811798095703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,2,1,power_law_1.01,0.055668478012084965
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,2,1,power_law_1.01,2.3103538513183595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,2,1,power_law_1.01,0.06029248237609863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,2,1,power_law_1.01,0.09778880119323731
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,2,1,power_law_1.01,0.13248319625854493
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,2,1,power_law_1.01,2.8969204711914065
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,2,1,power_law_1.01,0.16884799957275393
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,2,1,power_law_1.01,0.261909122467041
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,2,1,power_law_1.01,0.29549312591552734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,2,1,power_law_1.01,0.30185855865478517
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,2,1,power_law_1.01,0.5979577636718749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,2,1,power_law_1.01,0.3088569641113281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,2,1,power_law_1.01,0.31147840499877927
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,2,1,power_law_1.01,4.111942443847656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,2,1,power_law_1.01,0.3205062484741211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,2,1,power_law_1.01,0.3597491073608398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,2,1,power_law_1.01,0.3606969451904297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,2,1,power_law_1.01,0.3722323226928711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,2,1,power_law_1.01,0.3790047836303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,2,1,power_law_1.01,0.3830316925048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,2,1,power_law_1.01,0.662972183227539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,2,1,power_law_1.01,0.40285568237304686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,2,1,power_law_1.01,5.271357421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,2,1,power_law_1.01,0.4282444763183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.01,0.46907905578613285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.01,0.5451526260375976
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.01,0.6521273803710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.01,0.8320422363281249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.01,1.0161087799072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,2,1,power_law_1.01,6.55303955078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,2,1,power_law_1.2,0.06371071815490723
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.01,1.414176025390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,2,1,power_law_1.2,0.12516480445861816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,2,1,power_law_1.2,0.1896019172668457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.01,1.790965118408203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,2,1,power_law_1.2,0.2584012794494629
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,2,1,power_law_1.2,0.4806361770629882
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,2,1,power_law_1.2,0.5220959854125977
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.01,2.596449279785156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,2,1,power_law_1.2,0.5566412734985351
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,2,1,power_law_1.2,0.5851289749145507
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.01,3.373714599609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,2,1,power_law_1.2,0.6080358505249024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,2,1,power_law_1.2,0.07085887908935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,2,1,power_law_1.2,0.6506623840332031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.01,4.199135437011718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,2,1,power_law_1.2,0.6789778900146485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,2,1,power_law_1.2,0.7181330871582031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,2,1,power_law_1.2,0.6624057769775391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,2,1,power_law_1.2,0.7330924987792968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,2,1,power_law_1.2,0.8043468475341797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,2,1,power_law_1.2,0.9531142425537109
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,2,1,power_law_1.2,1.0955411529541015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,2,1,power_law_1.2,0.5497248077392578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,2,1,power_law_1.2,0.5584384155273437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,2,1,power_law_1.2,1.4141439819335937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,2,1,power_law_1.2,0.6298892974853516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,2,1,power_law_1.2,0.05515071868896484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,2,1,power_law_1.2,1.7056536865234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,2,1,power_law_1.2,0.057692799568176266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,2,1,power_law_1.2,0.08721664428710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,2,1,power_law_1.2,0.12031423568725585
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,2,1,power_law_1.2,2.2964044189453126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,2,1,power_law_1.2,0.15712512016296387
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,2,1,power_law_1.2,0.2692652893066406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,2,1,power_law_1.2,0.2952895927429199
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,2,1,power_law_1.2,0.308217601776123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,2,1,power_law_1.2,2.901814270019531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,2,1,power_law_1.2,0.3126201629638672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,2,1,power_law_1.2,0.3145427131652832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,2,1,power_law_1.2,0.3214080047607422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,2,1,power_law_1.2,0.36454334259033205
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,2,1,power_law_1.2,0.36871425628662113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,2,1,power_law_1.2,0.376701431274414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,2,1,power_law_1.2,0.38642879486083986
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,2,1,power_law_1.2,0.3923737716674805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,2,1,power_law_1.2,4.092545776367187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,2,1,power_law_1.2,0.4125145721435547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,2,1,power_law_1.2,0.43590145111083983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,2,1,power_law_1.2,0.4764831924438477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,2,1,power_law_1.2,0.5665907287597657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,2,1,power_law_1.2,0.65425537109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,2,1,power_law_1.2,0.8699878692626953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,2,1,power_law_1.2,1.0514636993408204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,2,1,power_law_1.2,5.333377685546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,2,1,power_law_1.2,1.3971110534667968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,2,1,power_law_1.01,0.19150272369384766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,2,1,power_law_1.2,1.831083526611328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,2,1,power_law_1.2,6.576314697265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,2,1,power_law_1.01,0.33880062103271485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,2,1,power_law_1.01,0.5511974334716797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,2,1,power_law_1.2,2.6179525756835935
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,2,1,power_law_1.01,0.7692288208007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,2,1,power_law_1.01,0.13758527755737304
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,2,1,power_law_1.2,3.420614929199219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,2,1,power_law_1.01,1.307869415283203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,2,1,power_law_1.01,1.4275712585449218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,2,1,power_law_1.01,1.5107968139648438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,2,1,power_law_1.01,1.5662425231933592
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,2,1,power_law_1.01,1.6111424255371094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,2,1,power_law_1.2,4.130508117675781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,2,1,power_law_1.01,1.6864218139648437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,2,1,power_law_1.01,1.8010105895996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,2,1,power_law_1.01,2.6288409423828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,2,1,power_law_1.01,2.698482666015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,2,1,power_law_1.01,2.8050149536132816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,2,1,power_law_1.01,2.875762634277344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,2,1,power_law_1.01,3.0338790893554686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,2,1,power_law_1.01,3.31961669921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,2,1,power_law_1.01,3.5283026123046874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,2,1,power_law_1.01,3.972574157714844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,2,1,power_law_1.01,4.6299108886718745
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,2,1,power_law_1.01,0.09144512176513672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,2,1,power_law_1.01,5.7916717529296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,2,1,power_law_1.01,0.13295488357543944
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,2,1,power_law_1.01,0.17907775878906249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,2,1,power_law_1.01,0.31281471252441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,2,1,power_law_1.01,7.161315307617187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,2,1,power_law_1.01,0.4311705780029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,2,1,power_law_1.01,0.7152992248535156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,2,1,power_law_1.01,0.7721177673339843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,2,1,power_law_1.01,0.8068434906005859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,2,1,power_law_1.01,0.834958724975586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,2,1,power_law_1.01,0.8534381103515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,2,1,power_law_1.01,0.8702642822265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,2,1,power_law_1.01,10.27577392578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,2,1,power_law_1.01,0.890610580444336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,2,1,power_law_1.01,0.969315185546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,2,1,power_law_1.01,0.9622470092773436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,2,1,power_law_1.01,1.0165017700195311
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,2,1,power_law_1.01,1.0047846221923828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,2,1,power_law_1.01,13.017381591796873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,2,1,power_law_1.01,1.0584486389160157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,2,1,power_law_1.01,1.1056102752685546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.01,1.253091812133789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.01,1.4085031127929688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.01,1.5895558166503907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.01,2.049557800292969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.01,2.423255615234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.01,3.288974609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,2,1,power_law_1.2,0.13897472381591797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,2,1,power_law_1.01,18.2975244140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.01,4.174082641601562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,2,1,power_law_1.2,0.15319104194641114
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,2,1,power_law_1.2,0.33857471466064454
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,2,1,power_law_1.2,0.4760742568969727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,2,1,power_law_1.2,0.6632236480712891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,2,1,power_law_1.2,1.2976800537109374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.01,5.7656201171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,2,1,power_law_1.2,1.4323263549804688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,2,1,power_law_1.2,1.5421760559082032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,2,1,power_law_1.2,1.608440246582031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.01,7.5905957031249995
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,2,1,power_law_1.2,1.6723660278320314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,2,1,power_law_1.01,23.9609521484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,2,1,power_law_1.2,1.7500344848632814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,2,1,power_law_1.2,1.850682830810547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.01,9.518595581054687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,2,1,power_law_1.2,2.735638427734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,2,1,power_law_1.2,2.7948980712890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,2,1,power_law_1.2,2.9518002319335936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,2,1,power_law_1.2,3.012115173339844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,2,1,power_law_1.2,3.1379827880859374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,2,1,power_law_1.2,3.343229370117187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,2,1,power_law_1.2,3.5399819946289064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,2,1,power_law_1.01,29.819272460937498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,2,1,power_law_1.2,4.119385681152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,2,1,power_law_1.2,4.692054443359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,2,1,power_law_1.2,5.9976000976562505
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,2,1,power_law_1.2,0.10105600357055664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,2,1,power_law_1.2,0.17428863525390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,2,1,power_law_1.2,7.305574951171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,2,1,power_law_1.2,0.2783449554443359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,2,1,power_law_1.2,0.3781299209594727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,2,1,power_law_1.2,0.7077401733398437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,2,1,power_law_1.2,0.7718854522705078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,2,1,power_law_1.2,0.09046848297119141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,2,1,power_law_1.2,10.372872314453124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,2,1,power_law_1.2,0.8224070739746093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,2,1,power_law_1.2,0.8541555023193359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,2,1,power_law_1.2,0.8699987030029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,2,1,power_law_1.2,0.8951923370361328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,2,1,power_law_1.2,0.9152352142333985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,2,1,power_law_1.2,1.007928924560547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,2,1,power_law_1.2,1.0282559967041016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,2,1,power_law_1.2,12.95808349609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,2,1,power_law_1.2,1.05893310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,2,1,power_law_1.2,1.0707904052734374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,2,1,power_law_1.2,1.1053913879394532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,2,1,power_law_1.2,1.1922796630859376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,2,1,power_law_1.2,1.2607552337646486
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,2,1,power_law_1.2,1.457918701171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,2,1,power_law_1.2,1.6566790771484374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,2,1,power_law_1.2,2.101137237548828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,2,1,power_law_1.2,2.489971771240234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,2,1,power_law_1.2,3.3215756225585933
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,2,1,power_law_1.2,18.517586669921876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,2,1,power_law_1.2,4.14302978515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,2,1,power_law_1.01,0.1733318328857422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,2,1,power_law_1.01,0.2528377532958984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,2,1,power_law_1.01,0.5077907180786132
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,2,1,power_law_1.01,0.453770866394043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,2,1,power_law_1.2,5.837715454101563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,2,1,power_law_1.01,1.0414278411865234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,2,1,power_law_1.01,1.5272146606445314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,2,1,power_law_1.01,1.7981459045410155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,2,1,power_law_1.2,7.483731079101562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,2,1,power_law_1.01,2.3858111572265623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,2,1,power_law_1.2,24.25717041015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,2,1,power_law_1.01,2.5461196899414062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,2,1,power_law_1.2,9.682267456054687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,2,1,power_law_1.01,2.6557406616210937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,2,1,power_law_1.01,2.7772882080078127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,2,1,power_law_1.01,2.871932067871094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,2,1,power_law_1.01,2.990035095214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,2,1,power_law_1.01,3.1581600952148436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,2,1,power_law_1.01,3.327408752441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,2,1,power_law_1.2,30.03066162109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,2,1,power_law_1.01,3.6199224853515624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,2,1,power_law_1.01,5.064739990234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,2,1,power_law_1.01,5.4870629882812505
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,2,1,power_law_1.01,5.842353515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,2,1,power_law_1.01,6.5153125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,2,1,power_law_1.01,7.049515991210937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,2,1,power_law_1.01,0.10945664405822755
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,2,1,power_law_1.01,8.11939453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,2,1,power_law_1.01,0.1559878444671631
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,2,1,power_law_1.01,9.454866943359374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,2,1,power_law_1.01,0.24016256332397462
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,2,1,power_law_1.01,0.2902067184448242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,2,1,power_law_1.01,0.5798348617553711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,2,1,power_law_1.01,0.8336608123779297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,2,1,power_law_1.01,12.00421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,2,1,power_law_1.01,0.9796998596191406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,2,1,power_law_1.01,1.2865689086914063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,2,1,power_law_1.01,1.369220428466797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,2,1,power_law_1.01,1.4302700805664064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,2,1,power_law_1.01,1.4898541259765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,2,1,power_law_1.01,14.33751220703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,2,1,power_law_1.01,1.5271653747558593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,2,1,power_law_1.01,1.5662797546386718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,2,1,power_law_1.01,1.629443817138672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,2,1,power_law_1.01,1.6612095642089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,2,1,power_law_1.01,1.6943685913085935
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,2,1,power_law_1.01,1.9540173339843752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,2,1,power_law_1.01,2.026225280761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.01,2.1764198303222657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.01,2.3660922241210938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,2,1,power_law_1.01,19.511601562499997
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.01,2.525587158203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.01,2.889576416015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.01,3.3068728637695317
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,2,1,power_law_1.2,0.17446592330932617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.01,4.1538388061523435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,2,1,power_law_1.01,24.77380615234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,2,1,power_law_1.2,0.2427622413635254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.01,4.913459777832031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,2,1,power_law_1.2,0.33638721466064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,2,1,power_law_1.2,0.5032211303710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,2,1,power_law_1.2,0.9103218841552735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.01,6.482218627929687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,2,1,power_law_1.2,1.371345977783203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,2,1,power_law_1.2,1.605030975341797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,2,1,power_law_1.2,2.272086334228516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.01,8.198251953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,2,1,power_law_1.2,2.409601287841797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,2,1,power_law_1.2,2.5442233276367188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,2,1,power_law_1.01,30.2342041015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,2,1,power_law_1.2,2.710604248046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,2,1,power_law_1.2,2.830097961425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.01,10.560429687500001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,2,1,power_law_1.2,2.9204089355468748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,2,1,power_law_1.2,3.141695861816406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,2,1,power_law_1.2,3.3549209594726563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,2,1,power_law_1.2,3.582030029296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,2,1,power_law_1.2,5.119956970214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,2,1,power_law_1.2,5.608402709960937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,2,1,power_law_1.2,6.026377563476562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,2,1,power_law_1.2,6.709703979492187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,2,1,power_law_1.2,7.335429077148437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,2,1,power_law_1.2,0.10926591873168945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,2,1,power_law_1.2,8.564876098632812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,2,1,power_law_1.2,0.15608768463134765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,2,1,power_law_1.2,0.20009599685668947
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,2,1,power_law_1.2,9.936490478515626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,2,1,power_law_1.2,0.2918163108825683
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,2,1,power_law_1.2,0.5048339080810547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,2,1,power_law_1.2,0.7432166290283203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,2,1,power_law_1.2,0.8730912017822267
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,2,1,power_law_1.2,12.391912841796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,2,1,power_law_1.2,1.2258380889892577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,2,1,power_law_1.2,1.2973651123046874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,2,1,power_law_1.2,1.364812774658203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,2,1,power_law_1.2,1.4429951477050782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,2,1,power_law_1.2,1.48991943359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,2,1,power_law_1.2,15.014631347656252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,2,1,power_law_1.2,1.5259199523925782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,2,1,power_law_1.2,1.5975897216796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,2,1,power_law_1.2,1.6403826904296874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,2,1,power_law_1.2,1.6951008605957032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,2,1,power_law_1.2,1.9736300659179686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,2,1,power_law_1.2,2.1006675720214845
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,2,1,power_law_1.2,2.223105926513672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,2,1,power_law_1.2,2.4394898986816407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,2,1,power_law_1.2,20.017440185546874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,2,1,power_law_1.2,2.635074462890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,2,1,power_law_1.2,3.111927185058594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,2,1,power_law_1.2,3.515475158691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,2,1,power_law_1.2,4.305274963378906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,2,1,power_law_1.2,5.011409912109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,2,1,power_law_1.2,25.3391455078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,4,1,power_law_1.01,0.06994495868682862
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,2,1,power_law_1.2,6.73096923828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,4,1,power_law_1.01,0.10501952171325683
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,4,1,power_law_1.01,0.12635840415954588
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,4,1,power_law_1.01,0.1969503974914551
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,2,1,power_law_1.2,8.458611450195312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,4,1,power_law_1.01,0.2045510482788086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,4,1,power_law_1.01,0.2180486488342285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,2,1,power_law_1.2,30.824677734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,2,1,power_law_1.2,10.497004394531249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,4,1,power_law_1.01,0.1912006378173828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,4,1,power_law_1.01,0.22779008865356448
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,4,1,power_law_1.01,0.19753664016723632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,4,1,power_law_1.01,0.19533632278442384
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,4,1,power_law_1.01,0.2806528091430664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,4,1,power_law_1.01,0.2432480049133301
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,4,1,power_law_1.01,0.37420799255371096
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,4,1,power_law_1.01,0.21245759963989258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,4,1,power_law_1.01,0.6022969436645508
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,4,1,power_law_1.01,0.26323007583618163
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,4,1,power_law_1.01,0.7417203521728515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,4,1,power_law_1.01,1.3916467285156249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,4,1,power_law_1.01,2.034839630126953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,4,1,power_law_1.01,2.626604309082031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,4,1,power_law_1.01,3.937534790039062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,4,1,power_law_1.01,0.2829363250732422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,4,1,power_law_1.01,0.2780575942993164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,4,1,power_law_1.01,0.2823814392089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,4,1,power_law_1.01,0.4287571334838868
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,4,1,power_law_1.01,5.186142578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,4,1,power_law_1.01,1.0361542510986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,4,1,power_law_1.01,0.06647168159484863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,4,1,power_law_1.01,0.11822400093078614
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,4,1,power_law_1.01,0.11531904220581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,4,1,power_law_1.01,6.699945068359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,4,1,power_law_1.01,0.15243776321411134
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,4,1,power_law_1.01,0.11476032257080078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,4,1,power_law_1.01,0.04919487953186035
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,4,1,power_law_1.01,0.11289728164672852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,4,1,power_law_1.01,0.1422329616546631
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,4,1,power_law_1.01,0.14506175994873047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,4,1,power_law_1.01,0.1623142433166504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,4,1,power_law_1.01,0.12084927558898925
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,4,1,power_law_1.01,0.0783135986328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,4,1,power_law_1.01,0.16928512573242188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,4,1,power_law_1.01,0.11962304115295411
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,4,1,power_law_1.01,0.16871423721313478
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,4,1,power_law_1.01,0.21915071487426757
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,4,1,power_law_1.01,0.1162700843811035
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.01,0.4052358245849609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.01,0.6008121490478515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.01,0.749151382446289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.01,1.4876856994628906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,4,1,power_law_1.2,0.06821631908416748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,4,1,power_law_1.2,0.09344703674316406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,4,1,power_law_1.01,0.15103487968444823
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.01,2.2764492797851563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.01,2.999139709472656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.01,3.7443923950195312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,4,1,power_law_1.2,0.1965580749511719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,4,1,power_law_1.2,0.1974323272705078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,4,1,power_law_1.2,0.20207807540893558
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,4,1,power_law_1.2,0.10668607711791993
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,4,1,power_law_1.2,0.18993919372558593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,4,1,power_law_1.2,0.1876371192932129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,4,1,power_law_1.2,0.251461124420166
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,4,1,power_law_1.2,0.2556883239746094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,4,1,power_law_1.2,0.2105292892456055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,4,1,power_law_1.2,0.2758745574951172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,4,1,power_law_1.2,0.294069766998291
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,4,1,power_law_1.2,0.2865350341796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,4,1,power_law_1.2,0.28234176635742186
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.01,0.2465203285217285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,4,1,power_law_1.2,0.3662623977661133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.01,0.33140926361083983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,4,1,power_law_1.2,0.43596351623535157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,4,1,power_law_1.2,0.579870719909668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,4,1,power_law_1.2,0.724540786743164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,4,1,power_law_1.2,1.108814697265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.01,1.1367123413085938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,4,1,power_law_1.2,1.3669293212890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,4,1,power_law_1.2,0.23492544174194335
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,4,1,power_law_1.2,2.0214898681640627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,4,1,power_law_1.2,0.21111936569213868
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,4,1,power_law_1.2,2.691441955566406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,4,1,power_law_1.2,0.11950976371765136
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,4,1,power_law_1.2,0.11125823974609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,4,1,power_law_1.2,0.11454143524169921
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,4,1,power_law_1.2,0.11777407646179198
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,4,1,power_law_1.2,0.11544896125793458
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,4,1,power_law_1.2,0.1177798366546631
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,4,1,power_law_1.2,0.12374719619750976
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,4,1,power_law_1.2,0.1370790386199951
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,4,1,power_law_1.2,3.881197509765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,4,1,power_law_1.2,0.06324543952941894
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,4,1,power_law_1.2,0.14420543670654298
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,4,1,power_law_1.2,0.15075072288513183
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,4,1,power_law_1.2,0.1465567970275879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,4,1,power_law_1.2,0.15803071975708008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,4,1,power_law_1.2,0.1692064094543457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,4,1,power_law_1.2,0.16946176528930662
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,4,1,power_law_1.2,0.21689151763916015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,4,1,power_law_1.2,0.24775871276855468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,4,1,power_law_1.2,0.41791934967041017
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,4,1,power_law_1.2,0.5844192123413086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,4,1,power_law_1.2,5.190844116210938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,4,1,power_law_1.2,0.7563660430908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,4,1,power_law_1.2,1.126376953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,4,1,power_law_1.2,0.04899456024169922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,4,1,power_law_1.2,0.07499968051910401
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,4,1,power_law_1.2,6.3719024658203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,4,1,power_law_1.2,1.4707597351074218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,4,1,power_law_1.01,0.09436479568481446
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,4,1,power_law_1.2,2.272051239013672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,4,1,power_law_1.2,2.944180603027344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,4,1,power_law_1.2,3.731919250488281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,4,1,power_law_1.01,0.324983024597168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,4,1,power_law_1.01,0.1861894416809082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,4,1,power_law_1.01,0.30221439361572267
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,4,1,power_law_1.01,0.3185728073120117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,4,1,power_law_1.01,0.3562188720703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,4,1,power_law_1.01,0.36433151245117185
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,4,1,power_law_1.01,0.3038457679748535
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,4,1,power_law_1.01,0.4065836715698242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,4,1,power_law_1.01,0.1508633613586426
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,4,1,power_law_1.01,0.39652862548828127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,4,1,power_law_1.2,0.31971647262573244
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,4,1,power_law_1.01,0.39363903045654297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,4,1,power_law_1.01,0.4226201629638672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,4,1,power_law_1.01,0.7297433471679687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,4,1,power_law_1.01,0.34989505767822265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,4,1,power_law_1.01,0.3558163070678711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,4,1,power_law_1.01,1.7909266662597656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,4,1,power_law_1.01,0.3130656051635742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,4,1,power_law_1.01,2.326252746582031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,4,1,power_law_1.01,3.3854757690429684
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,4,1,power_law_1.01,4.3861563110351565
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,4,1,power_law_1.01,0.4697190475463867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,4,1,power_law_1.01,0.6178739166259766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,4,1,power_law_1.01,0.9854252624511719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,4,1,power_law_1.01,1.212784652709961
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,4,1,power_law_1.01,6.47213134765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,4,1,power_law_1.01,0.061667199134826656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,4,1,power_law_1.01,0.17825536727905272
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,4,1,power_law_1.01,0.17664575576782227
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,4,1,power_law_1.01,0.1777280044555664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,4,1,power_law_1.01,9.218988037109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,4,1,power_law_1.01,0.18360448837280274
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,4,1,power_law_1.01,0.19948352813720702
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,4,1,power_law_1.01,0.19360319137573243
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,4,1,power_law_1.01,0.08886528015136719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,4,1,power_law_1.01,0.2059270477294922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,4,1,power_law_1.01,0.17939647674560547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,4,1,power_law_1.01,0.2457209587097168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,4,1,power_law_1.01,0.262360954284668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.01,0.38896961212158204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,4,1,power_law_1.01,0.17731264114379883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.01,0.5364851379394532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.01,0.6608422088623047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,4,1,power_law_1.01,0.11365504264831543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,4,1,power_law_1.01,0.17804607391357422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.01,0.9567520141601562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,4,1,power_law_1.01,11.1871240234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.01,1.2506195068359376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.01,1.8567289733886718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.01,2.4963104248046877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.01,3.6419244384765626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,4,1,power_law_1.01,0.22615936279296872
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.01,4.894040832519531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,4,1,power_law_1.2,0.09358016014099121
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,4,1,power_law_1.01,0.22815040588378904
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,4,1,power_law_1.2,0.34373374938964846
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,4,1,power_law_1.01,0.34382976531982423
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,4,1,power_law_1.2,0.35039936065673827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,4,1,power_law_1.2,0.3653747177124024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.01,5.977447509765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,4,1,power_law_1.2,0.3253433609008789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,4,1,power_law_1.2,0.3678854370117187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,4,1,power_law_1.2,0.39608768463134764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,4,1,power_law_1.2,0.4021222305297852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,4,1,power_law_1.2,0.3997094345092774
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,4,1,power_law_1.2,0.44231296539306636
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,4,1,power_law_1.2,0.13758655548095705
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,4,1,power_law_1.2,0.17122495651245118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,4,1,power_law_1.2,0.604664306640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,4,1,power_law_1.2,0.7091187286376953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,4,1,power_law_1.2,0.2894630432128906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,4,1,power_law_1.2,0.3046169662475586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,4,1,power_law_1.2,1.7500979614257812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,4,1,power_law_1.2,0.3581324768066406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,4,1,power_law_1.2,2.304149169921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,4,1,power_law_1.2,0.31319551467895507
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,4,1,power_law_1.2,3.367771606445312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,4,1,power_law_1.2,0.06321087837219239
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,4,1,power_law_1.2,4.375790710449219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,4,1,power_law_1.2,0.49748352050781247
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,4,1,power_law_1.2,0.9796761322021486
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,4,1,power_law_1.2,6.575946655273438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,4,1,power_law_1.2,0.17775423049926758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,4,1,power_law_1.2,1.2314009857177735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,4,1,power_law_1.2,0.17990720748901368
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,4,1,power_law_1.2,0.1817056083679199
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,4,1,power_law_1.2,0.17865728378295898
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,4,1,power_law_1.2,0.18117567062377932
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,4,1,power_law_1.2,0.19604799270629883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,4,1,power_law_1.2,0.19635648727416993
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,4,1,power_law_1.2,0.20057279586791993
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,4,1,power_law_1.2,0.22789440155029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,4,1,power_law_1.2,0.23126207351684572
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,4,1,power_law_1.2,0.25382400512695313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,4,1,power_law_1.2,0.27912767410278316
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,4,1,power_law_1.2,0.08231103897094727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,4,1,power_law_1.2,0.3334732818603515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,4,1,power_law_1.2,0.3856224060058594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,4,1,power_law_1.2,0.5175654220581054
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,4,1,power_law_1.2,9.169203491210938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,4,1,power_law_1.2,0.6742829132080078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,4,1,power_law_1.2,0.18885887145996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,4,1,power_law_1.2,0.9493196868896485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,4,1,power_law_1.2,1.2977343749999999
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,4,1,power_law_1.2,1.9168057250976562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,4,1,power_law_1.2,0.10613439559936524
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,4,1,power_law_1.2,2.5211257934570312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,4,1,power_law_1.01,0.11540608406066895
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,4,1,power_law_1.2,0.17722175598144532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,4,1,power_law_1.01,0.1467679977416992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,4,1,power_law_1.2,11.16489013671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,4,1,power_law_1.01,0.16532159805297852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,4,1,power_law_1.2,3.623735656738281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,4,1,power_law_1.01,0.3117299270629883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,4,1,power_law_1.01,0.48281600952148435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,4,1,power_law_1.01,0.6739027404785156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,4,1,power_law_1.01,0.9343987274169923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,4,1,power_law_1.2,4.811272888183593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,4,1,power_law_1.01,0.9695244598388673
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,4,1,power_law_1.01,1.0062694549560547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,4,1,power_law_1.01,1.0292269134521486
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,4,1,power_law_1.01,1.0893312072753907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,4,1,power_law_1.01,1.1403084564208985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,4,1,power_law_1.2,5.976026000976562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,4,1,power_law_1.01,1.1773638153076171
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,4,1,power_law_1.01,1.2664268493652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,4,1,power_law_1.01,1.8182745361328123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,4,1,power_law_1.01,1.853520050048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,4,1,power_law_1.01,1.910113983154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,4,1,power_law_1.01,2.06032958984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,4,1,power_law_1.01,2.1990144348144534
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,4,1,power_law_1.01,2.513981475830078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,4,1,power_law_1.01,2.8073529052734374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,4,1,power_law_1.01,0.07857855796813965
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,4,1,power_law_1.01,3.354946594238281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,4,1,power_law_1.01,0.10005824089050293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,4,1,power_law_1.01,3.904082641601563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,4,1,power_law_1.01,0.1113484764099121
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,4,1,power_law_1.01,0.18500991821289064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,4,1,power_law_1.01,0.284531192779541
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,4,1,power_law_1.01,5.289182739257813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,4,1,power_law_1.01,0.3670048141479492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,4,1,power_law_1.01,0.5184780883789062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,4,1,power_law_1.01,0.5423756790161133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,4,1,power_law_1.01,0.5595808029174805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,4,1,power_law_1.01,0.572465934753418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,4,1,power_law_1.01,6.6671630859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,4,1,power_law_1.01,0.60202880859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,4,1,power_law_1.01,0.6275654220581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,4,1,power_law_1.01,0.6425740814208984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,4,1,power_law_1.01,0.6661542510986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,4,1,power_law_1.01,0.7558265686035156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,4,1,power_law_1.01,0.7640953826904296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,4,1,power_law_1.01,0.8206400299072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,4,1,power_law_1.01,0.8552889251708985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.01,0.9041843414306641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,4,1,power_law_1.01,9.71512939453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.01,1.0148684692382812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.01,1.1053939056396485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.01,1.3576364135742187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.01,1.635167999267578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.01,2.1423251342773435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,4,1,power_law_1.2,0.11560319900512694
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,4,1,power_law_1.01,12.578676757812499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,4,1,power_law_1.2,0.1439788818359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,4,1,power_law_1.2,0.15188544273376464
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.01,2.6282138061523437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,4,1,power_law_1.2,0.27756671905517577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,4,1,power_law_1.2,0.449549446105957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.01,3.664426879882812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,4,1,power_law_1.2,0.5920691299438476
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,4,1,power_law_1.2,0.9101267242431641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,4,1,power_law_1.2,0.9617497253417969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.01,4.637795104980468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,4,1,power_law_1.2,0.9932588958740235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,4,1,power_law_1.01,15.302740478515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,4,1,power_law_1.2,1.022119674682617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,4,1,power_law_1.2,1.106258544921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,4,1,power_law_1.2,1.1437657928466796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.01,5.593434448242188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,4,1,power_law_1.2,1.204035186767578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,4,1,power_law_1.2,1.3147584533691405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,4,1,power_law_1.2,1.852812805175781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,4,1,power_law_1.2,1.889327392578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,4,1,power_law_1.2,1.9726943969726562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,4,1,power_law_1.2,2.1893145751953123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,4,1,power_law_1.2,2.3198316955566405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,4,1,power_law_1.2,2.635053405761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,4,1,power_law_1.2,2.8895602416992188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,4,1,power_law_1.2,3.4634475708007812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,4,1,power_law_1.2,0.07829055786132813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,4,1,power_law_1.2,0.09867839813232422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,4,1,power_law_1.2,0.105731201171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,4,1,power_law_1.2,4.112611694335937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,4,1,power_law_1.2,0.1802707290649414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,4,1,power_law_1.2,0.2566457557678222
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,4,1,power_law_1.2,0.3361715316772461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,4,1,power_law_1.2,5.39260498046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,4,1,power_law_1.2,0.5025798416137695
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,4,1,power_law_1.2,0.533230094909668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,4,1,power_law_1.2,0.5526188659667969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,4,1,power_law_1.2,0.568384017944336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,4,1,power_law_1.2,6.782071533203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,4,1,power_law_1.2,0.5973920059204102
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,4,1,power_law_1.2,0.6277593612670899
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,4,1,power_law_1.2,0.6473696136474609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,4,1,power_law_1.2,0.679797134399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,4,1,power_law_1.2,0.7750252532958984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,4,1,power_law_1.2,0.7929126739501953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,4,1,power_law_1.2,0.8446112060546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,4,1,power_law_1.2,0.8964364624023438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,4,1,power_law_1.2,9.904381713867187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,4,1,power_law_1.2,0.9502169799804687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,4,1,power_law_1.2,1.0709177398681642
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,4,1,power_law_1.2,1.1894214630126954
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,4,1,power_law_1.2,1.4305599975585939
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,4,1,power_law_1.2,1.739509735107422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,4,1,power_law_1.2,2.2052166748046877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,4,1,power_law_1.2,12.571766357421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,4,1,power_law_1.2,2.706065979003906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,4,1,power_law_1.2,3.7484371948242186
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,4,1,power_law_1.01,0.027053439617156984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,4,1,power_law_1.2,4.676217041015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,4,1,power_law_1.2,15.259033203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,4,1,power_law_1.01,0.042259840965270995
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,4,1,power_law_1.01,0.03566528081893921
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,4,1,power_law_1.01,0.0530291223526001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,4,1,power_law_1.2,5.737750854492187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,4,1,power_law_1.01,0.06122623920440674
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,4,1,power_law_1.01,0.09710975646972655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,4,1,power_law_1.01,0.10018367767333984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,4,1,power_law_1.01,0.08576959609985352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,4,1,power_law_1.01,0.09893759727478027
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,4,1,power_law_1.01,0.10134655952453613
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,4,1,power_law_1.01,0.11519295692443847
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,4,1,power_law_1.01,0.12153663635253906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,4,1,power_law_1.01,0.1930086326599121
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,4,1,power_law_1.01,0.11957695960998535
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,4,1,power_law_1.01,0.21879743576049804
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,4,1,power_law_1.01,0.12961728096008301
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,4,1,power_law_1.01,0.13316736221313477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,4,1,power_law_1.01,0.13538496017456053
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,4,1,power_law_1.01,0.14246335983276368
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,4,1,power_law_1.01,0.1531443214416504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,4,1,power_law_1.01,0.23542207717895508
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,4,1,power_law_1.01,0.3162630462646484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,4,1,power_law_1.01,0.37890880584716796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,4,1,power_law_1.01,0.5209171295166015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,4,1,power_law_1.01,0.6619705963134765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,4,1,power_law_1.01,0.9474956512451171
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,4,1,power_law_1.01,1.2209760284423827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,4,1,power_law_1.01,1.50396484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,4,1,power_law_1.01,0.029489281177520754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,4,1,power_law_1.01,0.03292288064956665
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,4,1,power_law_1.01,0.03723135948181152
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,4,1,power_law_1.01,0.045067520141601564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,4,1,power_law_1.01,0.051134080886840814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,4,1,power_law_1.01,0.06457151889801024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,4,1,power_law_1.01,0.08458047866821289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,4,1,power_law_1.01,0.09154623985290528
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,4,1,power_law_1.01,0.10293696403503419
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,4,1,power_law_1.01,0.10867520332336426
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,4,1,power_law_1.01,0.06905344009399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,4,1,power_law_1.01,0.07023551940917969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,4,1,power_law_1.01,0.07373760223388673
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,4,1,power_law_1.01,0.07196544170379639
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,4,1,power_law_1.01,0.07809855937957763
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,4,1,power_law_1.01,0.08139519691467285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,4,1,power_law_1.01,0.10635007858276366
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,4,1,power_law_1.01,0.11991295814514161
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,4,1,power_law_1.01,0.25986175537109374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,4,1,power_law_1.01,0.13047807693481445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,4,1,power_law_1.01,0.1889561653137207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,4,1,power_law_1.01,0.17256959915161132
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,2048,768,8,128,4,1,power_law_1.2,0.02709183931350708
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,4,1,power_law_1.01,0.3114828872680664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,4,1,power_law_1.01,0.437322883605957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,4,1,power_law_1.01,0.5545695877075195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,2048,768,8,128,4,1,power_law_1.2,0.038581759929656984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,2048,768,8,128,4,1,power_law_1.2,0.04843455791473389
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,4,1,power_law_1.01,0.7943801879882812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,2048,768,8,128,4,1,power_law_1.2,0.035727360248565675
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,2048,768,8,128,4,1,power_law_1.2,0.05870528221130371
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,4,1,power_law_1.01,1.0319058990478516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,4,1,power_law_1.01,1.2688057708740235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,2048,768,8,128,4,1,power_law_1.2,0.11938495635986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,2048,768,8,128,4,1,power_law_1.2,0.12189696311950685
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,2048,768,8,128,4,1,power_law_1.2,0.09508416175842285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,2048,768,8,128,4,1,power_law_1.2,0.09871423721313477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,2048,768,8,128,4,1,power_law_1.2,0.0877779197692871
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,2048,768,8,128,4,1,power_law_1.2,0.10045311927795411
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,2048,768,8,128,4,1,power_law_1.2,0.09966143608093261
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,2048,768,8,128,4,1,power_law_1.2,0.19491455078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,2048,768,8,128,4,1,power_law_1.2,0.22716096878051756
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,2048,768,8,128,4,1,power_law_1.2,0.31728895187377926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,2048,768,8,128,4,1,power_law_1.2,0.11590463638305663
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,2048,768,8,128,4,1,power_law_1.2,0.5286982345581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,2048,768,8,128,4,1,power_law_1.2,0.13109312057495118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,2048,768,8,128,4,1,power_law_1.2,0.13285183906555176
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,2048,768,8,128,4,1,power_law_1.2,0.1357158374786377
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,2048,768,8,128,4,1,power_law_1.2,0.14306816101074218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,2048,768,8,128,4,1,power_law_1.2,0.1535424041748047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,2048,768,8,128,4,1,power_law_1.2,0.6673248291015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,2048,768,8,128,4,1,power_law_1.2,0.03691135883331299
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,2048,768,8,128,4,1,power_law_1.2,0.04342912197113037
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,2048,768,8,128,4,1,power_law_1.2,1.22621826171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,2048,768,8,128,4,1,power_law_1.2,0.23595327377319336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,2048,768,8,128,4,1,power_law_1.2,0.04948607921600342
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,2048,768,8,128,4,1,power_law_1.2,1.513978271484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,2048,768,8,128,4,1,power_law_1.2,0.06643775939941407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,2048,768,8,128,4,1,power_law_1.2,0.06881919860839844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,2048,768,8,128,4,1,power_law_1.2,0.07095615863800049
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,2048,768,8,128,4,1,power_law_1.2,0.0733196783065796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,2048,768,8,128,4,1,power_law_1.2,0.38949760437011716
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,2048,768,8,128,4,1,power_law_1.2,0.07499392032623291
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,2048,768,8,128,4,1,power_law_1.2,0.07871935844421388
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,2048,768,8,128,4,1,power_law_1.2,0.0822815990447998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,2048,768,8,128,4,1,power_law_1.2,0.08680704116821289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,2048,768,8,128,4,1,power_law_1.2,0.09256832122802734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,2048,768,8,128,4,1,power_law_1.2,0.102673282623291
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,2048,768,8,128,4,1,power_law_1.2,0.10896575927734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,2048,768,8,128,4,1,power_law_1.2,0.176428165435791
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,2048,768,8,128,4,1,power_law_1.2,0.9528038024902343
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,2048,768,8,128,4,1,power_law_1.2,0.02980544090270996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,2048,768,8,128,4,1,power_law_1.2,0.03283711910247803
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,2048,768,8,128,4,1,power_law_1.2,0.2598470306396484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,2048,768,8,128,4,1,power_law_1.2,0.3192947196960449
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,2048,768,8,128,4,1,power_law_1.2,0.4402361679077148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,2048,768,8,128,4,1,power_law_1.2,0.5574700927734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,2048,768,8,128,4,1,power_law_1.2,0.12041791915893554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,2048,768,8,128,4,1,power_law_1.2,0.10786175727844238
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,2048,768,8,128,4,1,power_law_1.2,0.7966073608398437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,2048,768,8,128,4,1,power_law_1.2,1.035533447265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,4,1,power_law_1.01,0.12056896209716797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,2048,768,8,128,4,1,power_law_1.2,1.2782803344726563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,2048,768,8,128,4,1,power_law_1.2,0.18835968017578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,2048,768,8,128,4,1,power_law_1.2,0.13240896224975587
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,4,1,power_law_1.01,0.2903968048095703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,4,1,power_law_1.01,0.2983628845214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,4,1,power_law_1.01,0.31952896118164065
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,4,1,power_law_1.01,0.055382399559021
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,4,1,power_law_1.01,0.08084223747253419
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,4,1,power_law_1.01,0.0503276777267456
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,4,1,power_law_1.01,0.3352268981933594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,4,1,power_law_1.01,0.3398796844482422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,4,1,power_law_1.01,0.33834815979003907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,4,1,power_law_1.01,0.24771263122558596
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,4,1,power_law_1.01,0.38585792541503905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,4,1,power_law_1.01,0.37023937225341796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,4,1,power_law_1.01,0.40097793579101565
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,4,1,power_law_1.01,0.16020544052124025
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,4,1,power_law_1.01,0.4515737533569336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,4,1,power_law_1.01,0.5372294235229492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,4,1,power_law_1.01,0.6340198516845703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,4,1,power_law_1.01,0.7806111907958984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,4,1,power_law_1.01,0.9453330993652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,4,1,power_law_1.01,0.29227968215942385
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,4,1,power_law_1.01,0.3012646484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,4,1,power_law_1.01,0.04289919853210449
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,4,1,power_law_1.01,0.04966015815734863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,4,1,power_law_1.01,1.307464904785156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,4,1,power_law_1.01,0.06542208194732665
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,4,1,power_law_1.01,1.6676287841796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,4,1,power_law_1.01,0.0882323169708252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,4,1,power_law_1.01,0.11354240417480468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,4,1,power_law_1.01,0.16571903228759766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,4,1,power_law_1.01,0.182030086517334
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,4,1,power_law_1.01,0.18421567916870116
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,4,1,power_law_1.01,0.18915136337280275
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,4,1,power_law_1.01,2.4061351013183594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,4,1,power_law_1.01,0.1904876708984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,4,1,power_law_1.01,0.34499584197998046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,4,1,power_law_1.01,0.19814016342163085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,4,1,power_law_1.01,0.22670015335083007
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,4,1,power_law_1.01,0.22832511901855468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,4,1,power_law_1.01,0.24168512344360354
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,4,1,power_law_1.01,0.2365555191040039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,4,1,power_law_1.01,0.24618175506591794
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,4,1,power_law_1.01,0.2645471954345703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,4,1,power_law_1.01,3.098494567871094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,4,1,power_law_1.01,0.2901324844360352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.01,0.3098918342590332
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.01,0.3714995193481445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.01,0.43826110839843746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.01,0.5554361724853516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,4,1,power_law_1.01,3.853782348632812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.01,0.6665599822998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,4,1,power_law_1.2,0.050094079971313474
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.01,0.9229657745361328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.01,1.1937862396240235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,4,1,power_law_1.2,0.10969344139099121
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,4,1,power_law_1.2,0.14684032440185546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.01,1.7149945068359376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,4,1,power_law_1.2,0.28215232849121097
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,4,1,power_law_1.2,0.30215103149414063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.01,2.234062042236328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,4,1,power_law_1.2,0.325522575378418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,4,1,power_law_1.2,0.3406291198730469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.01,2.766645202636719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,4,1,power_law_1.2,0.07561088085174561
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,4,1,power_law_1.2,0.05242496013641358
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,4,1,power_law_1.2,0.3460160064697265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,4,1,power_law_1.2,0.343422737121582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,4,1,power_law_1.2,0.3922252655029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,4,1,power_law_1.2,0.40472064971923827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,4,1,power_law_1.2,0.2547135925292969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,4,1,power_law_1.2,0.45893695831298825
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,4,1,power_law_1.2,0.5448825454711914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,4,1,power_law_1.2,0.6480339050292969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,4,1,power_law_1.2,0.7924076843261718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,4,1,power_law_1.2,0.2971615982055664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,4,1,power_law_1.2,0.9895359802246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,4,1,power_law_1.2,0.3079148864746094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,4,1,power_law_1.2,1.3224601745605469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,4,1,power_law_1.2,0.043656959533691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,4,1,power_law_1.2,0.0484876823425293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,4,1,power_law_1.2,0.06284287929534912
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,4,1,power_law_1.2,1.7102316284179686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,4,1,power_law_1.2,0.08030400276184083
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,4,1,power_law_1.2,0.10775360107421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,4,1,power_law_1.2,0.3726335906982422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,4,1,power_law_1.2,0.35300159454345703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,4,1,power_law_1.2,0.16842111587524414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,4,1,power_law_1.2,0.1850387191772461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,4,1,power_law_1.2,2.4438706970214845
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,4,1,power_law_1.2,0.18548416137695312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,4,1,power_law_1.2,0.19165567398071287
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,4,1,power_law_1.2,0.19207935333251952
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,4,1,power_law_1.2,0.19886592864990232
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,4,1,power_law_1.2,0.2312153625488281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,4,1,power_law_1.2,0.2310041618347168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,4,1,power_law_1.2,0.2399705505371094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,4,1,power_law_1.2,0.24993408203124998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,4,1,power_law_1.2,3.1048901367187502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,4,1,power_law_1.2,0.25437696456909176
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,4,1,power_law_1.2,0.2764262390136719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,4,1,power_law_1.2,0.2901625633239746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,4,1,power_law_1.2,0.3116543960571289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,4,1,power_law_1.2,0.37987518310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,4,1,power_law_1.2,3.8344561767578127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,4,1,power_law_1.2,0.4436928176879883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,4,1,power_law_1.2,0.554901123046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,4,1,power_law_1.2,0.6840601348876953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,4,1,power_law_1.01,0.10161664009094237
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,4,1,power_law_1.01,0.12357695579528809
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,4,1,power_law_1.2,0.9350592041015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,4,1,power_law_1.01,0.1661222457885742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,4,1,power_law_1.2,1.1904223632812498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,4,1,power_law_1.01,0.33820735931396484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,4,1,power_law_1.01,0.4150086212158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,4,1,power_law_1.2,1.7293157958984373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,4,1,power_law_1.01,0.6748178863525391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,4,1,power_law_1.01,0.7387757110595703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,4,1,power_law_1.01,0.7975039672851563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,4,1,power_law_1.2,2.2478636169433592
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,4,1,power_law_1.01,0.823315200805664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,4,1,power_law_1.01,0.8386809539794922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,4,1,power_law_1.2,2.7576589965820313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,4,1,power_law_1.01,0.8712774658203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,4,1,power_law_1.01,0.9170713806152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,4,1,power_law_1.01,1.2972300720214842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,4,1,power_law_1.01,1.336747589111328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,4,1,power_law_1.01,1.3935411071777344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,4,1,power_law_1.01,1.4302983093261719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,4,1,power_law_1.01,1.508009033203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,4,1,power_law_1.01,1.6367391967773437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,4,1,power_law_1.01,1.7446617126464843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,4,1,power_law_1.01,1.988270721435547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,4,1,power_law_1.01,2.3247276306152345
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,4,1,power_law_1.01,2.958174743652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,4,1,power_law_1.01,0.07031680107116699
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,4,1,power_law_1.01,0.08897088050842286
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,4,1,power_law_1.01,3.655732421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,4,1,power_law_1.01,0.11292608261108399
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,4,1,power_law_1.01,0.17424768447875977
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,4,1,power_law_1.01,0.23501951217651368
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,4,1,power_law_1.01,0.3779449462890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,4,1,power_law_1.01,5.093419494628906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,4,1,power_law_1.01,0.4053945541381836
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,4,1,power_law_1.01,0.4307680130004883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,4,1,power_law_1.01,0.4466854476928711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,4,1,power_law_1.01,0.45666942596435545
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,4,1,power_law_1.01,0.46887935638427736
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,4,1,power_law_1.01,0.4806073760986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,4,1,power_law_1.01,6.4835986328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,4,1,power_law_1.01,0.5365311813354492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,4,1,power_law_1.01,0.5448326492309571
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,4,1,power_law_1.01,0.5521836853027343
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,4,1,power_law_1.01,0.5590841674804687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,4,1,power_law_1.01,0.5908243179321289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,4,1,power_law_1.01,0.6401554870605468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.01,0.6898957061767578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.01,0.7917689514160157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.01,0.9267417907714843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.01,1.1682291412353516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.01,1.4183955383300781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,4,1,power_law_1.01,9.664497680664063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,4,1,power_law_1.2,0.10332480430603028
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.01,1.9213516235351562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,4,1,power_law_1.2,0.10839296340942384
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,4,1,power_law_1.2,0.16470464706420898
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.01,2.4958714294433593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,4,1,power_law_1.2,0.2676959991455078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,4,1,power_law_1.2,0.3803526306152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,4,1,power_law_1.01,12.605823974609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,4,1,power_law_1.2,0.6709369659423828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.01,3.5072833251953126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,4,1,power_law_1.2,0.7442208099365234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,4,1,power_law_1.2,0.8157536315917969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,4,1,power_law_1.2,0.842941436767578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,4,1,power_law_1.2,0.8587462615966797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,4,1,power_law_1.2,0.9089228820800781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.01,4.4714047241210935
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,4,1,power_law_1.2,0.9420063781738282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,4,1,power_law_1.2,1.3622277832031249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,4,1,power_law_1.01,15.491192626953126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.01,5.5247021484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,4,1,power_law_1.2,1.3957011413574218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,4,1,power_law_1.2,1.4837791442871093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,4,1,power_law_1.2,1.515611572265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,4,1,power_law_1.2,1.5441548156738283
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,4,1,power_law_1.2,1.6632499694824219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,4,1,power_law_1.2,1.7605740356445314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,4,1,power_law_1.2,2.069441223144531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,4,1,power_law_1.2,2.3462803649902346
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,4,1,power_law_1.2,3.0264013671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,4,1,power_law_1.2,0.07331520080566406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,4,1,power_law_1.2,0.07833087921142579
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,4,1,power_law_1.2,3.7219738769531245
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,4,1,power_law_1.2,0.1104576015472412
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,4,1,power_law_1.2,0.1607980728149414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,4,1,power_law_1.2,0.2125606346130371
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,4,1,power_law_1.2,0.37482624053955077
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,4,1,power_law_1.2,0.4093759918212891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,4,1,power_law_1.2,5.094884338378906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,4,1,power_law_1.2,0.4395808029174805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,4,1,power_law_1.2,0.45829185485839846
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,4,1,power_law_1.2,0.46629055023193355
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,4,1,power_law_1.2,0.480775032043457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,4,1,power_law_1.2,0.49023616790771485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,4,1,power_law_1.2,0.5595372772216797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,4,1,power_law_1.2,6.545330810546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,4,1,power_law_1.2,0.5624703979492187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,4,1,power_law_1.2,0.5850425720214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,4,1,power_law_1.2,0.5968147277832031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,4,1,power_law_1.2,0.6200915145874023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,4,1,power_law_1.2,0.6544461059570312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,4,1,power_law_1.2,0.7127686309814453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,4,1,power_law_1.2,0.806640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,4,1,power_law_1.2,0.9416038513183593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,4,1,power_law_1.2,1.207697296142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,4,1,power_law_1.2,1.458572235107422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,4,1,power_law_1.2,9.529083251953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,4,1,power_law_1.2,1.9989517211914063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,4,1,power_law_1.01,0.14148096084594725
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,4,1,power_law_1.2,2.4923992919921876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,4,1,power_law_1.01,0.16925504684448242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,4,1,power_law_1.2,3.5490036010742188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,4,1,power_law_1.01,0.2446668815612793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,4,1,power_law_1.01,0.2840339279174805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,4,1,power_law_1.01,0.5601433563232422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,4,1,power_law_1.2,12.661866455078124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,4,1,power_law_1.2,4.5285272216796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,4,1,power_law_1.01,0.8014482879638672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,4,1,power_law_1.01,0.9543481445312499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,4,1,power_law_1.01,1.244040298461914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,4,1,power_law_1.01,1.317011260986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,4,1,power_law_1.2,5.579617309570312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,4,1,power_law_1.01,1.3662092590332031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,4,1,power_law_1.2,15.465394287109376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,4,1,power_law_1.01,1.4305024719238282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,4,1,power_law_1.01,1.4863058471679689
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,4,1,power_law_1.01,1.5280210876464844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,4,1,power_law_1.01,1.6304896545410155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,4,1,power_law_1.01,1.7124691772460938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,4,1,power_law_1.01,1.8099232482910157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,4,1,power_law_1.01,2.5374552917480466
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,4,1,power_law_1.01,2.7413241577148435
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,4,1,power_law_1.01,2.9126290893554687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,4,1,power_law_1.01,3.271285095214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,4,1,power_law_1.01,3.5896365356445314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,4,1,power_law_1.01,4.163749084472657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,4,1,power_law_1.01,0.09352191925048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,4,1,power_law_1.01,4.7439904785156255
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,4,1,power_law_1.01,0.1132800006866455
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,4,1,power_law_1.01,0.15752127647399902
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,4,1,power_law_1.01,0.1946668815612793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,4,1,power_law_1.01,5.90517822265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,4,1,power_law_1.01,0.34063358306884767
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,4,1,power_law_1.01,0.48226238250732417
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,4,1,power_law_1.01,0.5622086334228515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,4,1,power_law_1.01,0.7257612609863282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,4,1,power_law_1.01,7.28870361328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,4,1,power_law_1.01,0.7654463958740234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,4,1,power_law_1.01,0.7951910400390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,4,1,power_law_1.01,0.8256070709228516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,4,1,power_law_1.01,0.8493151855468749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,4,1,power_law_1.01,0.8753651428222657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,4,1,power_law_1.01,0.9029933166503905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,4,1,power_law_1.01,0.925265884399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,4,1,power_law_1.01,0.9477715301513673
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,4,1,power_law_1.01,10.509246826171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,4,1,power_law_1.01,1.0972537231445312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,4,1,power_law_1.01,1.1488735961914063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.01,1.2127423858642579
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.01,1.3136755371093751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.01,1.4389637756347657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.01,1.6809779357910155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,4,1,power_law_1.01,13.288157958984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.01,1.9450720214843749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.01,2.5124914550781248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,4,1,power_law_1.2,0.13691136360168457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,4,1,power_law_1.2,0.16995647430419922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.01,2.9712921142578126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,4,1,power_law_1.2,0.20214656829833982
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,4,1,power_law_1.2,0.2910092735290527
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,4,1,power_law_1.2,0.499046401977539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,4,1,power_law_1.01,16.166068115234374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.01,4.015647277832032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,4,1,power_law_1.2,0.7390271759033202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,4,1,power_law_1.2,0.8436249542236329
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,4,1,power_law_1.2,1.1864288330078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,4,1,power_law_1.2,1.2483430480957032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.01,5.125049438476562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,4,1,power_law_1.2,1.3105535888671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,4,1,power_law_1.2,1.39732666015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,4,1,power_law_1.2,1.4632640075683594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,4,1,power_law_1.2,1.4992697143554687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.01,6.2784704589843745
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,4,1,power_law_1.2,1.623540496826172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,4,1,power_law_1.2,1.7358944702148438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,4,1,power_law_1.2,1.8547161865234376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,4,1,power_law_1.2,2.5517837524414064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,4,1,power_law_1.2,2.7893572998046876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,4,1,power_law_1.2,3.007684631347656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,4,1,power_law_1.2,3.3751898193359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,4,1,power_law_1.2,3.7352005004882813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,4,1,power_law_1.2,4.346144714355469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,4,1,power_law_1.2,0.09342144012451173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,4,1,power_law_1.2,4.936499328613282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,4,1,power_law_1.2,0.11421183586120605
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,4,1,power_law_1.2,0.13480064392089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,4,1,power_law_1.2,6.166959838867188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,4,1,power_law_1.2,0.19556928634643556
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,4,1,power_law_1.2,0.3035519981384277
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,4,1,power_law_1.2,0.42768512725830077
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,4,1,power_law_1.2,0.5025196838378906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,4,1,power_law_1.2,0.6927059173583985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,4,1,power_law_1.2,0.7164205169677734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,4,1,power_law_1.2,7.5165252685546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,4,1,power_law_1.2,0.7661228942871093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,4,1,power_law_1.2,0.8018905639648437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,4,1,power_law_1.2,0.8303327941894532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,4,1,power_law_1.2,0.8519417572021485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,4,1,power_law_1.2,0.8916812896728515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,4,1,power_law_1.2,0.9121798706054687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,4,1,power_law_1.2,10.573045654296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,4,1,power_law_1.2,0.9466700744628905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,4,1,power_law_1.2,1.1030143737792968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,4,1,power_law_1.2,1.1675443267822265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,4,1,power_law_1.2,1.2491046142578124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,4,1,power_law_1.2,1.3910751342773438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,4,1,power_law_1.2,1.5088787841796876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,4,1,power_law_1.2,1.8025733947753906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,4,1,power_law_1.2,2.068078765869141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,4,1,power_law_1.2,13.556658935546874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,4,1,power_law_1.2,2.5779852294921874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,4,1,power_law_1.2,3.1062106323242187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,4,1,power_law_1.2,4.168179321289062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,4,1,power_law_1.2,16.1682275390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,8,1,power_law_1.01,0.06569024085998534
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,8,1,power_law_1.01,0.08070015907287598
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,8,1,power_law_1.01,0.11699328422546387
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,8,1,power_law_1.01,0.047109122276306155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,4,1,power_law_1.2,5.18878173828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,8,1,power_law_1.01,0.11563648223876952
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,8,1,power_law_1.01,0.11433600425720214
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,8,1,power_law_1.01,0.1502988815307617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,4,1,power_law_1.2,6.439725952148438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,8,1,power_law_1.01,0.10875583648681642
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,8,1,power_law_1.01,0.1097977638244629
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,8,1,power_law_1.01,0.17969024658203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,8,1,power_law_1.01,0.20621759414672852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,8,1,power_law_1.01,0.11069631576538086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,8,1,power_law_1.01,0.13470208168029785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,8,1,power_law_1.01,0.2598086357116699
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,8,1,power_law_1.01,0.34576766967773437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,8,1,power_law_1.01,0.16420223236083983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,8,1,power_law_1.01,0.11853759765625001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,8,1,power_law_1.01,0.3887871932983399
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,8,1,power_law_1.01,0.5397926330566406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,8,1,power_law_1.01,0.13486656188964843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,8,1,power_law_1.01,0.7426163482666015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,8,1,power_law_1.01,0.17680896759033202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,8,1,power_law_1.01,1.0453632354736329
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,8,1,power_law_1.01,0.14286016464233398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,8,1,power_law_1.01,2.0230560302734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,8,1,power_law_1.01,2.6989202880859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,8,1,power_law_1.01,3.3453964233398437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,8,1,power_law_1.01,0.04563583850860596
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,8,1,power_law_1.01,1.3904646301269532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,8,1,power_law_1.01,0.03522495985031128
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,8,1,power_law_1.01,0.07726975917816162
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,8,1,power_law_1.01,0.051521282196044925
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,8,1,power_law_1.01,0.08515456199645996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,8,1,power_law_1.01,0.09013567924499512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,8,1,power_law_1.01,0.09769151687622071
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,8,1,power_law_1.01,0.06981376171112061
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,8,1,power_law_1.01,0.088787841796875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,8,1,power_law_1.01,0.10873791694641113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,8,1,power_law_1.01,0.07063551902770995
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,8,1,power_law_1.01,0.14439552307128906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.01,0.15904831886291504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.01,0.20941696166992188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,8,1,power_law_1.01,0.07107135772705078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,8,1,power_law_1.01,0.07226240158081054
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.01,0.33744705200195313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,8,1,power_law_1.01,0.07283199787139892
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.01,0.43424190521240236
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,8,1,power_law_1.01,0.07329472064971923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.01,0.6127648162841797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.01,1.257470703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,8,1,power_law_1.2,0.046730241775512694
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.01,1.728314208984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.01,2.099584045410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,8,1,power_law_1.01,0.10224063873291016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,8,1,power_law_1.01,0.11116095542907715
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,8,1,power_law_1.2,0.10991680145263671
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,8,1,power_law_1.2,0.06504576206207276
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,8,1,power_law_1.2,0.10494400024414063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,8,1,power_law_1.2,0.1018560028076172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,8,1,power_law_1.2,0.0724012804031372
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,8,1,power_law_1.2,0.11954431533813477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,8,1,power_law_1.2,0.11088255882263183
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,8,1,power_law_1.2,0.1476863956451416
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,8,1,power_law_1.2,0.1087622356414795
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.01,0.2403264045715332
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,8,1,power_law_1.2,0.1790892791748047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,8,1,power_law_1.2,0.1813088035583496
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,8,1,power_law_1.2,0.20281408309936522
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,8,1,power_law_1.2,0.2632255935668945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,8,1,power_law_1.2,0.3140127944946289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,8,1,power_law_1.2,0.11138239860534668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.01,0.854408950805664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,8,1,power_law_1.2,0.388513298034668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,8,1,power_law_1.2,0.1523961639404297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,8,1,power_law_1.2,0.5482278442382812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,8,1,power_law_1.2,0.7358573150634766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,8,1,power_law_1.2,1.069713897705078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,8,1,power_law_1.2,1.3941075134277345
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,8,1,power_law_1.2,0.13830080032348632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,8,1,power_law_1.2,0.14794303894042968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,8,1,power_law_1.2,2.0265126037597656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,8,1,power_law_1.2,0.1336844825744629
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,8,1,power_law_1.2,0.07097087860107422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,8,1,power_law_1.2,0.07365568161010742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,8,1,power_law_1.2,2.744005126953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,8,1,power_law_1.2,3.401533508300781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,8,1,power_law_1.2,0.07969279766082764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,8,1,power_law_1.2,0.08795328140258789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,8,1,power_law_1.2,0.09300928115844727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,8,1,power_law_1.2,0.0965779209136963
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,8,1,power_law_1.2,0.08941760063171386
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,8,1,power_law_1.2,0.044326400756835936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,8,1,power_law_1.2,0.09938559532165528
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,8,1,power_law_1.2,0.11253824234008789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,8,1,power_law_1.2,0.03562175989151001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,8,1,power_law_1.2,0.07188992023468017
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,8,1,power_law_1.2,0.14233152389526366
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,8,1,power_law_1.2,0.07318912029266358
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,8,1,power_law_1.2,0.15864383697509765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,8,1,power_law_1.2,0.19542272567749025
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,8,1,power_law_1.2,0.24025983810424806
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,8,1,power_law_1.2,0.06982719898223877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,8,1,power_law_1.2,0.33420032501220703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,8,1,power_law_1.2,0.050481920242309575
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,8,1,power_law_1.2,0.43923904418945314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,8,1,power_law_1.2,0.0712614393234253
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,8,1,power_law_1.2,0.6282368087768555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,8,1,power_law_1.01,0.08838656425476074
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,8,1,power_law_1.2,0.8208959960937501
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,8,1,power_law_1.01,0.11049535751342773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,8,1,power_law_1.2,1.2371148681640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,8,1,power_law_1.2,1.7120895385742188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,8,1,power_law_1.2,2.123679962158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,8,1,power_law_1.2,0.11048255920410158
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,8,1,power_law_1.01,0.1628563117980957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,8,1,power_law_1.01,0.06055679798126221
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,8,1,power_law_1.01,0.16916032791137697
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,8,1,power_law_1.01,0.17769599914550782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,8,1,power_law_1.01,0.2504038429260254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,8,1,power_law_1.01,0.24952384948730472
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,8,1,power_law_1.01,0.17203712463378906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,8,1,power_law_1.01,0.258337287902832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,8,1,power_law_1.01,0.26537599563598635
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,8,1,power_law_1.01,0.17041919708251954
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,8,1,power_law_1.01,0.3659193420410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,8,1,power_law_1.01,0.17171775817871093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,8,1,power_law_1.01,0.3739315032958984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,8,1,power_law_1.01,0.5073791885375977
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,8,1,power_law_1.01,0.6296531295776366
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,8,1,power_law_1.01,0.9305030059814452
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,8,1,power_law_1.01,0.17949567794799806
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,8,1,power_law_1.01,1.2041190338134764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,8,1,power_law_1.01,0.19175487518310547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,8,1,power_law_1.01,1.786363525390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,8,1,power_law_1.01,0.1888275146484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,8,1,power_law_1.01,0.19378751754760742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,8,1,power_law_1.01,2.265411834716797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,8,1,power_law_1.01,0.09884480476379395
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,8,1,power_law_1.01,0.10215999603271483
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,8,1,power_law_1.01,0.10337471961975098
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,8,1,power_law_1.01,0.10275584220886232
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,8,1,power_law_1.01,0.10416895866394042
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,8,1,power_law_1.01,3.3658502197265627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,8,1,power_law_1.01,0.10796928405761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,8,1,power_law_1.01,0.11653696060180666
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,8,1,power_law_1.01,0.11482687950134278
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,8,1,power_law_1.01,0.11993023872375488
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,8,1,power_law_1.01,0.1364345645904541
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,8,1,power_law_1.01,0.14608384132385255
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,8,1,power_law_1.01,4.474830017089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,8,1,power_law_1.01,0.1558739185333252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,8,1,power_law_1.01,0.16316799163818357
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,8,1,power_law_1.01,0.2123871994018555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.01,0.224835205078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,8,1,power_law_1.01,0.07079296112060547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.01,0.2997318458557129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,8,1,power_law_1.01,5.560659790039063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.01,0.37609985351562497
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.01,0.5302937698364258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.01,0.660873565673828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.01,1.0190374755859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,8,1,power_law_1.01,0.10088768005371093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.01,1.3389715576171874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.01,1.9892115783691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,8,1,power_law_1.01,0.04691775798797607
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.01,2.645619201660156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.01,3.478092041015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,8,1,power_law_1.2,0.17492544174194335
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,8,1,power_law_1.01,0.06188096046447754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,8,1,power_law_1.2,0.1708608055114746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,8,1,power_law_1.2,0.1740185546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,8,1,power_law_1.2,0.09547455787658692
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,8,1,power_law_1.2,0.08430335998535157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,8,1,power_law_1.2,0.1818284797668457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,8,1,power_law_1.2,0.25033983230590817
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,8,1,power_law_1.2,0.1633011245727539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,8,1,power_law_1.2,0.059991679191589355
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,8,1,power_law_1.2,0.2504249572753906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,8,1,power_law_1.2,0.2629062461853027
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,8,1,power_law_1.2,0.2661030387878418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,8,1,power_law_1.2,0.3486816024780274
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,8,1,power_law_1.2,0.37484737396240236
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,8,1,power_law_1.2,0.5103174209594726
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,8,1,power_law_1.2,0.16219648361206054
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,8,1,power_law_1.2,0.6333248138427734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,8,1,power_law_1.2,0.9334457397460938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,8,1,power_law_1.2,0.1867616081237793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,8,1,power_law_1.2,1.203362579345703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,8,1,power_law_1.2,1.7901951599121095
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,8,1,power_law_1.2,0.05003327846527099
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,8,1,power_law_1.2,2.303877716064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,8,1,power_law_1.2,0.19079872131347658
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,8,1,power_law_1.2,0.1941702461242676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,8,1,power_law_1.2,0.19016128540039062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,8,1,power_law_1.2,0.09907008171081542
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,8,1,power_law_1.2,0.09763392448425293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,8,1,power_law_1.2,0.10201279640197754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,8,1,power_law_1.2,0.10369471549987792
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,8,1,power_law_1.2,0.10273280143737792
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,8,1,power_law_1.2,0.10504063606262207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,8,1,power_law_1.2,0.10902015686035156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,8,1,power_law_1.2,0.11633024215698243
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,8,1,power_law_1.2,0.11715519905090332
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,8,1,power_law_1.2,0.13735360145568848
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,8,1,power_law_1.2,3.4074221801757814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,8,1,power_law_1.2,0.14473792076110842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,8,1,power_law_1.2,0.1577196788787842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,8,1,power_law_1.2,0.20159423828124998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,8,1,power_law_1.2,0.1628998374938965
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,8,1,power_law_1.2,0.21979583740234374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,8,1,power_law_1.2,0.29361087799072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,8,1,power_law_1.2,0.37663169860839846
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,8,1,power_law_1.2,4.483722229003907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,8,1,power_law_1.2,0.5136127853393555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,8,1,power_law_1.2,0.6551219177246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,8,1,power_law_1.2,0.06835584163665771
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,8,1,power_law_1.2,1.025909729003906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,8,1,power_law_1.2,5.571343994140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,8,1,power_law_1.2,1.3472537231445312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,8,1,power_law_1.01,0.1023641586303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,8,1,power_law_1.01,0.11541312217712403
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,8,1,power_law_1.01,0.12397952079772949
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,8,1,power_law_1.2,1.9714950561523437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,8,1,power_law_1.2,0.11404352188110352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,8,1,power_law_1.01,0.1804300880432129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,8,1,power_law_1.01,0.2696147155761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,8,1,power_law_1.2,2.6891213989257814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,8,1,power_law_1.01,0.42200065612792964
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,8,1,power_law_1.01,0.5006732940673828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,8,1,power_law_1.01,0.5173734283447265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,8,1,power_law_1.2,3.264602966308594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,8,1,power_law_1.01,0.535293426513672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,8,1,power_law_1.01,0.5473932647705079
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,8,1,power_law_1.01,0.6570175933837891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,8,1,power_law_1.01,0.6014649581909179
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,8,1,power_law_1.01,0.6595046234130859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,8,1,power_law_1.01,0.6800685119628906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,8,1,power_law_1.01,0.9246975708007813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,8,1,power_law_1.2,0.058950400352478026
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,8,1,power_law_1.01,0.8965382385253907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,8,1,power_law_1.01,0.9778572845458985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,8,1,power_law_1.01,1.0666175842285157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,8,1,power_law_1.01,1.1687193298339844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,8,1,power_law_1.01,1.2954258728027344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,8,1,power_law_1.01,1.4788479614257812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,8,1,power_law_1.01,1.8193927001953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,8,1,power_law_1.01,2.166983642578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,8,1,power_law_1.01,0.06742784023284912
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,8,1,power_law_1.01,0.07961023807525634
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,8,1,power_law_1.01,0.08621503829956054
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,8,1,power_law_1.01,2.9134381103515627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,8,1,power_law_1.01,0.1271846389770508
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,8,1,power_law_1.01,3.7068249511718747
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,8,1,power_law_1.01,0.19177087783813476
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,8,1,power_law_1.01,0.23649599075317385
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,8,1,power_law_1.01,0.3279673767089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,8,1,power_law_1.01,0.3394393539428711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,8,1,power_law_1.01,0.35262401580810543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,8,1,power_law_1.01,0.36191616058349607
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,8,1,power_law_1.01,0.37991168975830075
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,8,1,power_law_1.01,5.244859008789062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,8,1,power_law_1.01,0.4001171112060547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,8,1,power_law_1.01,0.4114400100708008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,8,1,power_law_1.01,0.42322368621826173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,8,1,power_law_1.01,0.5130041503906251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,8,1,power_law_1.01,0.5162464141845703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,8,1,power_law_1.01,0.5329715347290038
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,8,1,power_law_1.01,0.5601318359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,8,1,power_law_1.01,6.833892211914062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.01,0.5933427047729493
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.01,0.6913555145263672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.01,0.7506861114501954
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.01,0.9246208190917968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,8,1,power_law_1.01,8.198101806640626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.01,1.1072889709472657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,8,1,power_law_1.2,0.10233087539672851
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.01,1.4500851440429687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,8,1,power_law_1.2,0.11547712326049804
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,8,1,power_law_1.2,0.11857279777526855
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.01,1.8252178955078127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,8,1,power_law_1.2,0.16952512741088868
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,8,1,power_law_1.2,0.24600959777832032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,8,1,power_law_1.2,0.35498111724853515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,8,1,power_law_1.2,0.484587516784668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.01,2.576514587402344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,8,1,power_law_1.2,0.5130847930908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,8,1,power_law_1.2,0.5286899185180663
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,8,1,power_law_1.2,0.548263053894043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.01,3.3240588378906253
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,8,1,power_law_1.2,0.6274848175048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,8,1,power_law_1.2,0.6527232360839844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,8,1,power_law_1.2,0.6659986877441406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,8,1,power_law_1.2,0.7016371154785157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,8,1,power_law_1.2,0.9235199737548829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.01,3.9747564697265623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,8,1,power_law_1.2,0.9569107055664062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,8,1,power_law_1.2,1.0162579345703127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,8,1,power_law_1.2,1.1496147155761718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,8,1,power_law_1.2,1.2206130981445313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,8,1,power_law_1.2,1.3786810302734376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,8,1,power_law_1.2,1.5306182861328126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,8,1,power_law_1.2,1.858853759765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,8,1,power_law_1.2,0.06713791847229003
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,8,1,power_law_1.2,2.221240997314453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,8,1,power_law_1.2,0.07990911960601807
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,8,1,power_law_1.2,0.08281536102294922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,8,1,power_law_1.2,2.9698092651367185
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,8,1,power_law_1.2,0.11949312210083007
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,8,1,power_law_1.2,0.18136703491210937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,8,1,power_law_1.2,0.21914880752563476
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,8,1,power_law_1.2,0.3207321548461914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,8,1,power_law_1.2,0.33795646667480467
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,8,1,power_law_1.2,3.7669491577148433
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,8,1,power_law_1.2,0.3478604888916016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,8,1,power_law_1.2,0.3569184112548828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,8,1,power_law_1.2,0.37878273010253904
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,8,1,power_law_1.2,0.40442623138427736
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,8,1,power_law_1.2,0.4140703964233398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,8,1,power_law_1.2,0.43089473724365235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,8,1,power_law_1.2,5.204638671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,8,1,power_law_1.2,0.5169382476806641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,8,1,power_law_1.2,0.5302521514892578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,8,1,power_law_1.2,0.5438835144042968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,8,1,power_law_1.2,0.5955615997314453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,8,1,power_law_1.2,0.64970947265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,8,1,power_law_1.2,0.7224134063720703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,8,1,power_law_1.2,0.7962201690673828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,8,1,power_law_1.2,6.819700317382813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,8,1,power_law_1.2,0.9648108673095702
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,8,1,power_law_1.2,1.1346336364746095
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,8,1,power_law_1.2,1.474929962158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,8,1,power_law_1.01,0.048010878562927246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,8,1,power_law_1.2,8.403050537109376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,8,1,power_law_1.01,0.058305277824401855
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,8,1,power_law_1.2,1.8526765441894533
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,8,1,power_law_1.01,0.1666867256164551
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,8,1,power_law_1.2,2.5543174743652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,8,1,power_law_1.01,0.07498303890228272
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,8,1,power_law_1.01,0.03887936115264893
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,8,1,power_law_1.01,0.16275648117065428
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,8,1,power_law_1.2,3.389584045410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,8,1,power_law_1.01,0.14194687843322754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,8,1,power_law_1.01,0.21206272125244138
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,8,1,power_law_1.01,0.2227251243591309
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,8,1,power_law_1.2,4.028193359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,8,1,power_law_1.01,0.09921343803405762
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,8,1,power_law_1.01,0.22766016006469725
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,8,1,power_law_1.01,0.23288511276245116
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,8,1,power_law_1.01,0.24364736557006833
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,8,1,power_law_1.01,0.15816831588745117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,8,1,power_law_1.01,0.33177406311035157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,8,1,power_law_1.01,0.37483264923095705
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,8,1,power_law_1.01,0.40705726623535154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,8,1,power_law_1.01,0.16810111999511718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,8,1,power_law_1.01,0.6563398742675781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,8,1,power_law_1.01,0.1981760025024414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,8,1,power_law_1.01,0.2056300735473633
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,8,1,power_law_1.01,0.906561279296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,8,1,power_law_1.01,0.035879681110382075
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,8,1,power_law_1.01,1.1464697265625001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,8,1,power_law_1.01,0.04951871871948242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,8,1,power_law_1.01,0.06051648139953614
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,8,1,power_law_1.01,0.07112639904022217
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,8,1,power_law_1.01,1.6689900207519532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,8,1,power_law_1.01,0.09536895751953126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,8,1,power_law_1.01,0.2592300796508789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,8,1,power_law_1.01,0.10541888236999512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,8,1,power_law_1.01,0.10823552131652832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,8,1,power_law_1.01,2.133756103515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,8,1,power_law_1.01,0.1106879997253418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,8,1,power_law_1.01,0.11295616149902343
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,8,1,power_law_1.01,0.12257599830627441
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,8,1,power_law_1.01,0.12835583686828614
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,8,1,power_law_1.01,0.13364864349365235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,8,1,power_law_1.01,2.6053869628906248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,8,1,power_law_1.01,0.14607104301452636
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,8,1,power_law_1.01,0.5433772659301758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,8,1,power_law_1.01,0.16730815887451173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,8,1,power_law_1.01,0.17786943435668945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,8,1,power_law_1.01,0.19435712814331055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.01,0.7250605010986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,8,1,power_law_1.01,0.041146240234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.01,0.9218278503417968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,8,1,power_law_1.01,0.1714022445678711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.01,1.3260012817382811
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,8,1,power_law_1.2,0.04063551902770996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.01,0.3093222427368164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.01,0.4331379318237305
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.01,0.2879974365234375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,8,1,power_law_1.2,0.046709117889404295
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,8,1,power_law_1.2,0.05577023983001709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,8,1,power_law_1.2,0.07035903930664063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.01,0.21138624191284178
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.01,0.5181516647338867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,8,1,power_law_1.2,0.08925632476806641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,8,1,power_law_1.2,0.16815168380737305
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,8,1,power_law_1.2,0.1606649589538574
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.01,1.7304165649414063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,8,1,power_law_1.2,0.1659846305847168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,8,1,power_law_1.2,0.20059520721435548
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,8,1,power_law_1.2,0.20881727218627927
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,8,1,power_law_1.2,0.2146847915649414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,8,1,power_law_1.2,0.2242252731323242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,8,1,power_law_1.2,0.23071680068969727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,8,1,power_law_1.2,0.2348934364318848
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,8,1,power_law_1.2,0.24396991729736328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,8,1,power_law_1.2,0.26053056716918943
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,8,1,power_law_1.2,0.14409791946411132
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,8,1,power_law_1.2,0.3357702255249023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,8,1,power_law_1.2,0.38926849365234373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,8,1,power_law_1.2,0.5463257598876953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,8,1,power_law_1.2,0.673617935180664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,8,1,power_law_1.2,0.914682846069336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,8,1,power_law_1.2,1.154272003173828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,8,1,power_law_1.2,0.03573312044143677
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,8,1,power_law_1.2,0.17038911819458008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,8,1,power_law_1.2,0.0475878381729126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,8,1,power_law_1.2,1.6440698242187501
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,8,1,power_law_1.2,0.05836800098419189
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,8,1,power_law_1.2,0.06800255775451661
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,8,1,power_law_1.2,0.09853759765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,8,1,power_law_1.2,0.10668864250183105
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,8,1,power_law_1.2,0.10944064140319824
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,8,1,power_law_1.2,2.1511795043945314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,8,1,power_law_1.2,0.11332032203674317
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,8,1,power_law_1.2,0.11598208427429199
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.01,2.131582794189453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,8,1,power_law_1.2,0.12365568161010743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,8,1,power_law_1.2,0.12919615745544433
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,8,1,power_law_1.2,0.13658944129943848
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,8,1,power_law_1.2,2.6283718872070314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,8,1,power_law_1.2,0.1479980754852295
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,8,1,power_law_1.2,0.16838016510009765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,8,1,power_law_1.2,0.4070457458496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,8,1,power_law_1.2,0.18013120651245118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,8,1,power_law_1.2,0.19641664505004883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,8,1,power_law_1.2,0.3107948875427246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,8,1,power_law_1.2,0.5293900680541992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,8,1,power_law_1.2,0.7288358306884766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,8,1,power_law_1.2,0.0409119987487793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,8,1,power_law_1.2,0.9248281860351563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,8,1,power_law_1.01,0.08781503677368165
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,8,1,power_law_1.2,1.3285900878906252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,8,1,power_law_1.01,0.09704511642456055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,8,1,power_law_1.2,0.17391807556152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,8,1,power_law_1.01,0.1143660831451416
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,8,1,power_law_1.2,1.7337811279296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,8,1,power_law_1.01,0.16962623596191406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,8,1,power_law_1.01,0.2258380889892578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,8,1,power_law_1.2,0.4342246246337891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,8,1,power_law_1.01,0.38408832550048827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,8,1,power_law_1.2,2.1466387939453124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,8,1,power_law_1.01,0.4115558242797851
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,8,1,power_law_1.2,0.29510080337524414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,8,1,power_law_1.01,0.4207929611206055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,8,1,power_law_1.2,0.21336063385009765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,8,1,power_law_1.01,0.43660736083984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,8,1,power_law_1.01,0.4487609481811523
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,8,1,power_law_1.01,0.48447231292724613
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,8,1,power_law_1.01,0.5223724746704101
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,8,1,power_law_1.01,0.6855001831054688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,8,1,power_law_1.01,0.6965670776367188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,8,1,power_law_1.01,0.7131053161621094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,8,1,power_law_1.01,0.727027816772461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,8,1,power_law_1.01,0.7732173156738281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,8,1,power_law_1.01,0.8495839691162109
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,8,1,power_law_1.01,0.9149759674072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,8,1,power_law_1.01,1.0439033508300781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,8,1,power_law_1.01,1.2281241607666016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,8,1,power_law_1.01,1.5978930664062498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,8,1,power_law_1.01,1.9853228759765624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,8,1,power_law_1.01,2.8038143920898437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,8,1,power_law_1.01,3.60076416015625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,8,1,power_law_1.01,0.060866560935974125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,8,1,power_law_1.01,0.07028287887573242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,8,1,power_law_1.01,0.08463040351867676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,8,1,power_law_1.01,0.26101055145263674
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,8,1,power_law_1.01,5.183381347656249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,8,1,power_law_1.01,0.2735955238342285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,8,1,power_law_1.01,0.2809375953674317
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,8,1,power_law_1.01,0.1195641613006592
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,8,1,power_law_1.01,0.29437503814697263
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,8,1,power_law_1.01,6.695479736328124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,8,1,power_law_1.01,0.30220991134643554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,8,1,power_law_1.01,0.16309183120727538
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,8,1,power_law_1.01,0.24805503845214844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,8,1,power_law_1.01,8.417412719726562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,8,1,power_law_1.01,0.2872729682922363
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,8,1,power_law_1.01,0.3799884796142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,8,1,power_law_1.01,0.38609920501708983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,8,1,power_law_1.01,0.3913811111450195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,8,1,power_law_1.01,0.3969535827636719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,8,1,power_law_1.01,0.4130681610107422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,8,1,power_law_1.01,0.4487225723266602
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.01,0.6712397003173829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.01,0.8634496307373046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.01,1.0401216125488282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.01,1.4533164978027344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.01,0.5057855987548828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,8,1,power_law_1.2,0.0876518440246582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.01,0.5670860671997071
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.01,1.8210047912597656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,8,1,power_law_1.2,0.09016896247863769
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,8,1,power_law_1.2,0.11340928077697754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,8,1,power_law_1.2,0.15543423652648927
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,8,1,power_law_1.2,0.20433536529541016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,8,1,power_law_1.2,0.38583873748779296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,8,1,power_law_1.2,0.40637119293212887
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.01,2.6541497802734377
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,8,1,power_law_1.2,0.42705665588378905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,8,1,power_law_1.2,0.45193729400634763
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,8,1,power_law_1.2,0.4649862289428711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,8,1,power_law_1.2,0.5203001785278321
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,8,1,power_law_1.2,0.5371692657470704
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.01,3.4034054565429686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,8,1,power_law_1.2,0.7037337493896485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,8,1,power_law_1.2,0.7165491485595703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,8,1,power_law_1.2,0.7383065795898437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,8,1,power_law_1.2,0.7586291503906251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,8,1,power_law_1.2,0.7957523345947266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,8,1,power_law_1.2,0.8769446563720702
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,8,1,power_law_1.2,0.9249497222900391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.01,4.182297058105469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,8,1,power_law_1.2,1.0778291320800781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,8,1,power_law_1.2,1.254813461303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,8,1,power_law_1.2,1.6056690979003907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,8,1,power_law_1.2,2.01154052734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,8,1,power_law_1.2,0.08375935554504395
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,8,1,power_law_1.2,2.8057644653320315
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,8,1,power_law_1.2,0.11000000000000001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,8,1,power_law_1.2,0.14848959922790528
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,8,1,power_law_1.2,3.6107705688476566
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,8,1,power_law_1.2,0.24507328033447268
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,8,1,power_law_1.2,0.06066880226135254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,8,1,power_law_1.2,0.2643507194519043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,8,1,power_law_1.2,0.06469759941101075
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,8,1,power_law_1.2,0.2790470314025879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,8,1,power_law_1.2,0.28844160079956055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,8,1,power_law_1.2,0.30249792098999023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,8,1,power_law_1.2,0.30946687698364256
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,8,1,power_law_1.2,0.3902252960205078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,8,1,power_law_1.2,5.192710571289062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,8,1,power_law_1.2,0.39454910278320315
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,8,1,power_law_1.2,0.4048921585083008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,8,1,power_law_1.2,0.41084224700927735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,8,1,power_law_1.2,0.4283712005615234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,8,1,power_law_1.2,0.47837566375732427
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,8,1,power_law_1.2,0.5129695892333984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,8,1,power_law_1.2,6.76703857421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,8,1,power_law_1.2,0.6037638473510742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,8,1,power_law_1.2,0.6740351867675781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,8,1,power_law_1.2,0.2930899238586426
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,8,1,power_law_1.2,0.889257583618164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,8,1,power_law_1.2,1.0628192138671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,8,1,power_law_1.2,8.437302856445312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,8,1,power_law_1.2,1.4509631347656249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,8,1,power_law_1.01,0.12462656021118164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,8,1,power_law_1.2,1.8412800598144532
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,8,1,power_law_1.01,0.13745792388916017
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,8,1,power_law_1.01,0.17226367950439453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,8,1,power_law_1.01,0.1887603187561035
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,8,1,power_law_1.01,0.31851839065551757
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,8,1,power_law_1.2,2.6401422119140627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,8,1,power_law_1.01,0.4735078430175781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,8,1,power_law_1.01,0.5195711898803711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,8,1,power_law_1.01,0.6890796661376953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,8,1,power_law_1.2,3.4274777221679686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,8,1,power_law_1.01,0.7169190216064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,8,1,power_law_1.01,0.7354137420654296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,8,1,power_law_1.01,0.7700608062744141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,8,1,power_law_1.2,4.243570556640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,8,1,power_law_1.01,0.7900998687744141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,8,1,power_law_1.01,0.8204077148437501
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,8,1,power_law_1.01,0.8932972717285157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,8,1,power_law_1.01,0.923096923828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,8,1,power_law_1.01,0.9662163543701172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,8,1,power_law_1.01,1.3316088867187499
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,8,1,power_law_1.01,1.3938117980957032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,8,1,power_law_1.01,1.4917887878417968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,8,1,power_law_1.01,1.7141075134277344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,8,1,power_law_1.01,1.8792134094238282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,8,1,power_law_1.01,2.2833351135253905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,8,1,power_law_1.01,0.08377344131469726
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,8,1,power_law_1.01,2.6654739379882812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,8,1,power_law_1.01,0.09567872047424317
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,8,1,power_law_1.01,3.304227905273437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,8,1,power_law_1.01,0.11788800239562988
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,8,1,power_law_1.01,0.13064064025878905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,8,1,power_law_1.01,0.2234169578552246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,8,1,power_law_1.01,4.076590576171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,8,1,power_law_1.01,0.30773120880126953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,8,1,power_law_1.01,0.3427980804443359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,8,1,power_law_1.01,0.4377740859985352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,8,1,power_law_1.01,0.4587392044067383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,8,1,power_law_1.01,0.4782400131225586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,8,1,power_law_1.01,0.5039635086059571
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,8,1,power_law_1.01,5.5930023193359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,8,1,power_law_1.01,0.5166035079956055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,8,1,power_law_1.01,0.5315577697753906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,8,1,power_law_1.01,0.5525555038452149
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,8,1,power_law_1.01,0.5712319946289062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,8,1,power_law_1.01,0.580398712158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,8,1,power_law_1.01,0.7103424072265625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,8,1,power_law_1.01,0.7439142608642578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,8,1,power_law_1.01,7.285309448242188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.01,0.7842809295654296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.01,0.8774995422363281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.01,0.9617785644531249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.01,1.134667510986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,8,1,power_law_1.01,9.11561279296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.01,1.3158892822265624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.01,1.6961209106445314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,8,1,power_law_1.2,0.12485183715820311
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,8,1,power_law_1.2,0.1383033561706543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.01,2.0858393859863282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,8,1,power_law_1.2,0.15160832405090333
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,8,1,power_law_1.2,0.18906047821044922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,8,1,power_law_1.2,0.2877900886535644
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.01,2.8480569458007814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,8,1,power_law_1.2,0.4571187210083008
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,8,1,power_law_1.2,0.4834355163574219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,8,1,power_law_1.2,0.676200942993164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,8,1,power_law_1.2,0.6953004455566406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.01,3.6429953002929687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,8,1,power_law_1.2,0.7160704040527344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,8,1,power_law_1.2,0.7545446777343751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,8,1,power_law_1.2,0.7808979034423829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,8,1,power_law_1.2,0.8114534759521485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,8,1,power_law_1.2,0.882644500732422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.01,4.426679077148437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,8,1,power_law_1.2,0.9234636688232423
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,8,1,power_law_1.2,0.9829766082763672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,8,1,power_law_1.2,1.3248191833496095
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,8,1,power_law_1.2,1.4228070068359375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,8,1,power_law_1.2,1.550287322998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,8,1,power_law_1.2,1.7685536193847657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,8,1,power_law_1.2,1.9500250244140624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,8,1,power_law_1.2,2.363242950439453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,8,1,power_law_1.2,0.0833516788482666
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,8,1,power_law_1.2,2.709597473144531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,8,1,power_law_1.2,0.09667840003967285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,8,1,power_law_1.2,3.3972363281249995
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,8,1,power_law_1.2,0.10796095848083495
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,8,1,power_law_1.2,0.13347200393676756
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,8,1,power_law_1.2,0.20666303634643554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,8,1,power_law_1.2,4.162199707031251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,8,1,power_law_1.2,0.270068473815918
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,8,1,power_law_1.2,0.31655168533325195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,8,1,power_law_1.2,0.424661750793457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,8,1,power_law_1.2,0.440830078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,8,1,power_law_1.2,0.46144382476806645
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,8,1,power_law_1.2,0.48685760498046876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,8,1,power_law_1.2,5.764128417968751
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,8,1,power_law_1.2,0.5075027084350585
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,8,1,power_law_1.2,0.5195097732543945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,8,1,power_law_1.2,0.5464620971679688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,8,1,power_law_1.2,0.562421760559082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,8,1,power_law_1.2,0.5823513412475586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,8,1,power_law_1.2,0.7071494293212891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,8,1,power_law_1.2,7.341432495117187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,8,1,power_law_1.2,0.7686009979248046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,8,1,power_law_1.2,0.8292205047607422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,8,1,power_law_1.2,0.912332763671875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,8,1,power_law_1.2,1.0144767761230469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,8,1,power_law_1.2,9.139088134765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,8,1,power_law_1.2,1.2092671966552735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,16,1,power_law_1.01,0.05563072204589844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,8,1,power_law_1.2,1.3962969970703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,16,1,power_law_1.01,0.057013759613037104
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,16,1,power_law_1.01,0.06892223834991455
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,8,1,power_law_1.2,1.7876934814453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,16,1,power_law_1.01,0.0987667179107666
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,16,1,power_law_1.01,0.10105279922485351
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,16,1,power_law_1.01,0.10268287658691407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,16,1,power_law_1.01,0.10258048057556153
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,16,1,power_law_1.01,0.10338560104370118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,16,1,power_law_1.01,0.05127232074737549
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,16,1,power_law_1.01,0.10536064147949217
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,16,1,power_law_1.01,0.10963199615478517
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,16,1,power_law_1.01,0.11045696258544921
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,8,1,power_law_1.2,2.1494374084472656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,16,1,power_law_1.01,0.11531519889831543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,16,1,power_law_1.01,0.12024255752563477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,16,1,power_law_1.01,0.1249407958984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,16,1,power_law_1.01,0.1326259231567383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,16,1,power_law_1.01,0.14273599624633787
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,16,1,power_law_1.01,0.18509632110595703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,16,1,power_law_1.01,0.22656768798828125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,16,1,power_law_1.01,0.3209695816040039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,16,1,power_law_1.01,0.3981536102294922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,8,1,power_law_1.2,2.927506408691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,16,1,power_law_1.01,0.573100814819336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,16,1,power_law_1.01,0.7213760375976562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,16,1,power_law_1.01,0.03545151948928833
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,16,1,power_law_1.01,1.0513324737548828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,16,1,power_law_1.01,0.04003520011901855
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,16,1,power_law_1.01,0.042308478355407714
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,16,1,power_law_1.01,0.049086079597473145
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,16,1,power_law_1.01,1.379052734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,16,1,power_law_1.01,0.05691967964172363
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,16,1,power_law_1.01,0.05678719997406005
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,8,1,power_law_1.2,3.680823669433594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,16,1,power_law_1.01,0.05924223899841309
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,16,1,power_law_1.01,0.058745598793029784
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,16,1,power_law_1.01,0.05931519985198974
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,16,1,power_law_1.01,0.060294399261474604
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,16,1,power_law_1.01,0.06223487854003906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,16,1,power_law_1.01,0.06276095867156982
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,16,1,power_law_1.01,2.0356127929687498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,16,1,power_law_1.01,0.06655168056488037
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,16,1,power_law_1.01,0.07208000183105469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,16,1,power_law_1.01,0.07495168209075928
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,16,1,power_law_1.01,0.07723135948181152
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,16,1,power_law_1.01,0.07561344146728516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,16,1,power_law_1.01,0.08905535697937011
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.01,0.11560447692871094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,8,1,power_law_1.2,4.522938842773438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.01,0.1349132823944092
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.01,0.16268800735473632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.01,0.22180799484252928
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,16,1,power_law_1.01,2.6957351684570314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.01,0.2839583969116211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.01,0.4056447982788086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,16,1,power_law_1.2,0.04899775981903076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,16,1,power_law_1.2,0.05228352069854736
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.01,0.5133996963500976
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,16,1,power_law_1.2,0.0556870412826538
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,16,1,power_law_1.2,0.0695423984527588
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,16,1,power_law_1.2,0.09759615898132325
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.01,0.7664115142822265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,16,1,power_law_1.2,0.10086527824401856
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,16,1,power_law_1.2,0.10163647651672363
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,16,1,power_law_1.2,0.1027948760986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,16,1,power_law_1.01,3.3975244140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,16,1,power_law_1.2,0.1038047981262207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.01,0.9894668579101562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,16,1,power_law_1.2,0.10937536239624024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,16,1,power_law_1.2,0.10682239532470703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,16,1,power_law_1.2,0.11073087692260741
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,16,1,power_law_1.2,0.11633919715881347
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,16,1,power_law_1.2,0.12086463928222657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,16,1,power_law_1.2,0.12461567878723145
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.01,1.2619993591308594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,16,1,power_law_1.2,0.14127360343933107
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,16,1,power_law_1.2,0.14017600059509278
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,16,1,power_law_1.2,0.1818227195739746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,16,1,power_law_1.2,0.22890176773071289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,16,1,power_law_1.2,0.3258252716064453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,16,1,power_law_1.2,0.40342334747314457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,16,1,power_law_1.2,0.5609247970581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,16,1,power_law_1.2,0.7279436492919922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,16,1,power_law_1.2,0.035155200958251955
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,16,1,power_law_1.2,0.039635839462280276
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,16,1,power_law_1.2,0.040759038925170896
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,16,1,power_law_1.2,1.049266586303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,16,1,power_law_1.2,0.055252480506896975
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,16,1,power_law_1.2,0.05787775993347168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,16,1,power_law_1.2,1.3756268310546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,16,1,power_law_1.2,0.0576857614517212
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,16,1,power_law_1.2,0.05915328025817871
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,16,1,power_law_1.2,0.061284480094909666
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,16,1,power_law_1.2,0.06006080150604248
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,16,1,power_law_1.2,0.06148159980773926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,16,1,power_law_1.2,0.06299392223358155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,16,1,power_law_1.2,0.06724031925201415
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,16,1,power_law_1.2,2.0381190490722654
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,16,1,power_law_1.2,0.07259520053863525
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,16,1,power_law_1.2,0.07513728141784667
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,16,1,power_law_1.2,0.07684735774993896
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,16,1,power_law_1.2,0.07702847957611084
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,16,1,power_law_1.2,0.08786368370056152
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,16,1,power_law_1.2,0.11649791717529297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,16,1,power_law_1.2,0.1346540832519531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,16,1,power_law_1.2,0.16324031829833985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,16,1,power_law_1.2,2.6885400390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,16,1,power_law_1.2,0.2204742431640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,16,1,power_law_1.2,0.28530752182006835
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,16,1,power_law_1.2,0.40658943176269535
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,16,1,power_law_1.01,0.06378047943115235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,16,1,power_law_1.2,0.5255750274658203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,16,1,power_law_1.01,0.07174911975860596
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,16,1,power_law_1.01,0.07818624019622802
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,16,1,power_law_1.2,3.3931469726562495
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,16,1,power_law_1.2,0.7647270202636719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,16,1,power_law_1.2,0.04938240051269531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,16,1,power_law_1.01,0.1448243236541748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,16,1,power_law_1.01,0.14706239700317383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,16,1,power_law_1.01,0.14959872245788575
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,16,1,power_law_1.2,0.9994675445556641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,16,1,power_law_1.01,0.1513657569885254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,16,1,power_law_1.01,0.15081536293029785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,16,1,power_law_1.01,0.15539199829101563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,16,1,power_law_1.01,0.16036415100097656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,16,1,power_law_1.2,1.247612762451172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,16,1,power_law_1.01,0.1627315139770508
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,16,1,power_law_1.01,0.1730291175842285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,16,1,power_law_1.01,0.18083135604858397
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,16,1,power_law_1.01,0.18402816772460937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,16,1,power_law_1.01,0.19584768295288085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,16,1,power_law_1.01,0.20694271087646485
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,16,1,power_law_1.01,0.2995968055725098
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,16,1,power_law_1.01,0.39244800567626953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,16,1,power_law_1.01,0.09964799880981445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,16,1,power_law_1.01,0.49211711883544923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,16,1,power_law_1.01,0.6353523254394531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,16,1,power_law_1.01,0.9163520050048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,16,1,power_law_1.01,0.05017471790313721
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,16,1,power_law_1.01,1.1944403076171874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,16,1,power_law_1.01,0.052771840095520016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,16,1,power_law_1.01,0.06725503921508788
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,16,1,power_law_1.01,0.07636799812316894
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,16,1,power_law_1.01,1.7651199340820312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,16,1,power_law_1.01,0.07795775890350341
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,16,1,power_law_1.01,0.07812928199768067
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,16,1,power_law_1.01,0.08047167778015137
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,16,1,power_law_1.01,0.07989120006561279
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,16,1,power_law_1.01,0.08049535751342773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,16,1,power_law_1.01,0.08300288200378418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,16,1,power_law_1.01,0.08424575805664063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,16,1,power_law_1.01,2.3431365966796873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,16,1,power_law_1.01,0.08575039863586426
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,16,1,power_law_1.01,0.08934911727905273
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,16,1,power_law_1.01,0.09139391899108887
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,16,1,power_law_1.01,0.10003968238830567
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,16,1,power_law_1.01,0.10188991546630859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,16,1,power_law_1.01,0.14935487747192383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.01,0.1571129608154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.01,0.1895948791503906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.01,0.252604808807373
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,16,1,power_law_1.01,0.043909120559692386
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.01,0.3435161590576172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.01,0.43229568481445313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,16,1,power_law_1.01,3.494097900390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.01,0.6179142379760743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,16,1,power_law_1.2,0.07152128219604492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.01,0.7808544158935546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,16,1,power_law_1.2,0.07617152214050293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,16,1,power_law_1.2,0.10126015663146973
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.01,1.1859276580810547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,16,1,power_law_1.2,0.1429862403869629
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,16,1,power_law_1.01,4.632787170410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,16,1,power_law_1.2,0.14692288398742676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,16,1,power_law_1.2,0.15187135696411133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,16,1,power_law_1.2,0.14950719833374024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,16,1,power_law_1.2,0.15463808059692383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.01,1.586525421142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,16,1,power_law_1.2,0.06288703918457031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,16,1,power_law_1.2,0.1567404842376709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,16,1,power_law_1.2,0.16181951522827148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,16,1,power_law_1.2,0.16327360153198242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,16,1,power_law_1.2,0.16919872283935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,16,1,power_law_1.2,0.18743488311767578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,16,1,power_law_1.2,0.1861452865600586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.01,1.9948518371582034
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,16,1,power_law_1.2,0.20022207260131836
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,16,1,power_law_1.2,0.2049958419799805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,16,1,power_law_1.01,5.776571044921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,16,1,power_law_1.2,0.29712127685546874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,16,1,power_law_1.2,0.3889664077758789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,16,1,power_law_1.2,0.49428863525390626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,16,1,power_law_1.2,0.6442969512939454
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,16,1,power_law_1.2,0.9192940521240235
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,16,1,power_law_1.2,0.044765439033508304
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,16,1,power_law_1.2,1.1994745635986328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,16,1,power_law_1.2,0.04841599941253662
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,16,1,power_law_1.2,0.05213696002960205
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,16,1,power_law_1.2,1.764038391113281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,16,1,power_law_1.2,0.07614143848419189
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,16,1,power_law_1.2,0.0768230390548706
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,16,1,power_law_1.2,0.08096832275390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,16,1,power_law_1.2,0.07886144161224365
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,16,1,power_law_1.2,0.07969279766082764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,16,1,power_law_1.2,0.08176768302917481
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,16,1,power_law_1.2,0.08208448410034179
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,16,1,power_law_1.2,2.3419935607910154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,16,1,power_law_1.2,0.08378047943115234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,16,1,power_law_1.2,0.08544063568115234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,16,1,power_law_1.2,0.08894207954406738
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,16,1,power_law_1.2,0.09333951950073242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,16,1,power_law_1.2,0.10026687622070311
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,16,1,power_law_1.2,0.10185152053833009
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,16,1,power_law_1.2,0.14107328414916992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,16,1,power_law_1.2,0.15782400131225588
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,16,1,power_law_1.2,0.18785280227661133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,16,1,power_law_1.2,0.2507731246948242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,16,1,power_law_1.2,0.3397657775878906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,16,1,power_law_1.2,3.4851129150390627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,16,1,power_law_1.2,0.43411903381347655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,16,1,power_law_1.2,0.6196128082275391
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,16,1,power_law_1.2,0.06684351921081542
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,16,1,power_law_1.2,0.7934636688232422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,16,1,power_law_1.01,0.09405183792114258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,16,1,power_law_1.2,1.1912691497802734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,16,1,power_law_1.2,4.6426904296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,16,1,power_law_1.01,0.10334591865539551
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,16,1,power_law_1.01,0.10716032028198241
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,16,1,power_law_1.2,1.567955780029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,16,1,power_law_1.01,0.13329407691955567
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,16,1,power_law_1.01,0.17535232543945312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,16,1,power_law_1.2,2.0205842590332033
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,16,1,power_law_1.01,0.21287424087524415
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,16,1,power_law_1.2,5.784270019531251
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,16,1,power_law_1.01,0.28832191467285156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,16,1,power_law_1.01,0.3005081558227539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,16,1,power_law_1.01,0.3124083137512207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,16,1,power_law_1.01,0.3208281707763672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,16,1,power_law_1.01,0.3725964736938477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,16,1,power_law_1.01,0.41994049072265627
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,16,1,power_law_1.01,0.421135368347168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,16,1,power_law_1.01,0.43432769775390623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,16,1,power_law_1.01,0.4754220962524414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,16,1,power_law_1.01,0.4925651168823242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,16,1,power_law_1.01,0.5343936157226563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,16,1,power_law_1.01,0.6290611267089844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,16,1,power_law_1.01,0.7081049346923829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,16,1,power_law_1.01,0.7608582305908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,16,1,power_law_1.01,0.8352998352050781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,16,1,power_law_1.01,1.0783539581298829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,16,1,power_law_1.01,1.2879481506347656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,16,1,power_law_1.01,0.06026688098907471
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,16,1,power_law_1.01,0.07181312084197998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,16,1,power_law_1.01,1.779365692138672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,16,1,power_law_1.01,0.07753471851348877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,16,1,power_law_1.01,0.10553407669067383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,16,1,power_law_1.01,2.262238006591797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,16,1,power_law_1.01,0.1402937602996826
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,16,1,power_law_1.01,0.17609472274780275
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,16,1,power_law_1.01,0.24265663146972657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,16,1,power_law_1.01,0.2522143936157227
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,16,1,power_law_1.01,0.2580831909179687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,16,1,power_law_1.01,0.2629779243469238
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,16,1,power_law_1.01,0.27493824005126954
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,16,1,power_law_1.01,3.2290853881835937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,16,1,power_law_1.01,0.28402816772460937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,16,1,power_law_1.01,0.29890560150146483
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,16,1,power_law_1.01,0.30291839599609377
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,16,1,power_law_1.01,0.37262081146240233
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,16,1,power_law_1.01,0.3788883209228516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,16,1,power_law_1.01,0.3975155258178711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,16,1,power_law_1.01,4.226067810058593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,16,1,power_law_1.01,0.4219769668579102
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.01,0.45581310272216796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.01,0.5487353515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.01,0.608427505493164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,16,1,power_law_1.01,5.18083251953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.01,0.7362131500244141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.01,0.9076985931396484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.01,1.191685104370117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,16,1,power_law_1.2,0.09408255577087402
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,16,1,power_law_1.2,0.10335424423217773
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,16,1,power_law_1.2,0.10530048370361329
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.01,1.4965939331054687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,16,1,power_law_1.2,0.12787584304809568
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,16,1,power_law_1.2,0.15771136283874512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,16,1,power_law_1.2,0.19744575500488282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.01,2.091455993652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,16,1,power_law_1.2,0.2826028823852539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,16,1,power_law_1.2,0.2965260887145996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,16,1,power_law_1.2,0.30617279052734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,16,1,power_law_1.2,0.3244403076171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.01,2.6954855346679687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,16,1,power_law_1.2,0.3937209701538086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,16,1,power_law_1.2,0.41924095153808594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,16,1,power_law_1.2,0.42786304473876957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,16,1,power_law_1.2,0.4405344009399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.01,3.3113543701171877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,16,1,power_law_1.2,0.5002924728393554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,16,1,power_law_1.2,0.5157721710205079
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,16,1,power_law_1.2,0.5662080001831055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,16,1,power_law_1.2,0.6959391784667969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,16,1,power_law_1.2,0.7307622528076172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,16,1,power_law_1.2,0.7902265930175781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,16,1,power_law_1.2,0.8664832305908202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,16,1,power_law_1.2,1.1028697967529297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,16,1,power_law_1.2,1.331481628417969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,16,1,power_law_1.2,0.060128641128540036
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,16,1,power_law_1.2,0.0715174388885498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,16,1,power_law_1.2,1.8096095275878905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,16,1,power_law_1.2,0.075033597946167
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,16,1,power_law_1.2,0.09917183876037597
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,16,1,power_law_1.2,2.277996826171875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,16,1,power_law_1.2,0.12925312042236328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,16,1,power_law_1.2,0.16235456466674805
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,16,1,power_law_1.2,0.2409382438659668
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,16,1,power_law_1.2,0.24728832244873047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,16,1,power_law_1.2,0.2592115211486816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,16,1,power_law_1.2,3.2753875732421873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,16,1,power_law_1.2,0.26169151306152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,16,1,power_law_1.2,0.2746137619018555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,16,1,power_law_1.2,0.28285375595092777
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,16,1,power_law_1.2,0.29079551696777345
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,16,1,power_law_1.2,0.3140134429931641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,16,1,power_law_1.2,4.223359985351562
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,16,1,power_law_1.2,0.38226047515869144
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,16,1,power_law_1.2,0.39213439941406253
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,16,1,power_law_1.2,0.40639297485351566
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,16,1,power_law_1.2,0.45255168914794924
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,16,1,power_law_1.2,0.5075225448608398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,16,1,power_law_1.2,0.5723532867431641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,16,1,power_law_1.2,0.633546257019043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,16,1,power_law_1.2,0.7721555328369141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,16,1,power_law_1.2,5.196455078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,16,1,power_law_1.2,0.9284307098388671
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,16,1,power_law_1.2,1.2067584228515624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,16,1,power_law_1.2,1.5176824951171874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,16,1,power_law_1.01,0.04039360046386718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,16,1,power_law_1.01,0.05711040019989013
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,16,1,power_law_1.01,0.06199488162994384
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,16,1,power_law_1.2,2.1119544982910154
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,16,1,power_law_1.01,0.07087679862976073
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,16,1,power_law_1.01,0.11008895874023436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,16,1,power_law_1.01,0.11270336151123046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,16,1,power_law_1.01,0.12185600280761719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,16,1,power_law_1.2,2.7241778564453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,16,1,power_law_1.01,0.1316716766357422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,16,1,power_law_1.01,0.1414355182647705
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,16,1,power_law_1.01,0.07932544231414795
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,16,1,power_law_1.01,0.14447296142578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,16,1,power_law_1.01,0.10387583732604981
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,16,1,power_law_1.01,0.14934144020080567
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,16,1,power_law_1.01,0.1541107177734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,16,1,power_law_1.01,0.15743231773376465
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,16,1,power_law_1.01,0.16716224670410157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,16,1,power_law_1.2,3.347134704589844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,16,1,power_law_1.01,0.18915647506713867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,16,1,power_law_1.01,0.20676671981811526
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,16,1,power_law_1.01,0.11779647827148439
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,16,1,power_law_1.01,0.2699551963806152
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,16,1,power_law_1.01,0.3328806304931641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,16,1,power_law_1.01,0.47238208770751955
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,16,1,power_law_1.01,0.582677116394043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,16,1,power_law_1.01,0.03788800001144409
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,16,1,power_law_1.01,0.042524161338806155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,16,1,power_law_1.01,0.8195161437988281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,16,1,power_law_1.01,0.05016384124755859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,16,1,power_law_1.01,0.05923007965087891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,16,1,power_law_1.01,1.0691136169433595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,16,1,power_law_1.01,0.07007936000823975
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,16,1,power_law_1.01,0.09292927742004395
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,16,1,power_law_1.01,0.09986175537109375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,16,1,power_law_1.01,0.10372672080993653
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,16,1,power_law_1.01,0.10597439765930176
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,16,1,power_law_1.01,0.10712960243225098
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,16,1,power_law_1.01,1.558983612060547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,16,1,power_law_1.01,0.11073344230651856
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,16,1,power_law_1.01,0.1329759979248047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,16,1,power_law_1.01,0.1347987174987793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,16,1,power_law_1.01,0.14097023963928224
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,16,1,power_law_1.01,0.14521408081054688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,16,1,power_law_1.01,0.1510099220275879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,16,1,power_law_1.01,2.0625817871093752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,16,1,power_law_1.01,0.1663929557800293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,16,1,power_law_1.01,0.19395456314086915
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,16,1,power_law_1.01,0.21304704666137697
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,16,1,power_law_1.01,0.2516774368286133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,16,1,power_law_1.01,2.5495706176757813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,16,1,power_law_1.01,0.29400896072387694
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,16,1,power_law_1.01,0.39611839294433593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,16,1,power_law_1.01,0.47538494110107427
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,16,1,power_law_1.01,0.658990707397461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,16,1,power_law_1.01,0.845902099609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,16,1,power_law_1.2,0.06059008121490479
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,16,1,power_law_1.2,0.06817599773406982
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,16,1,power_law_1.2,0.07661439895629882
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,16,1,power_law_1.01,1.2178809356689453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,16,1,power_law_1.2,0.10415616035461425
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,16,1,power_law_1.2,0.04323391914367676
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,16,1,power_law_1.2,0.11100159645080568
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,16,1,power_law_1.2,0.1148192024230957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,16,1,power_law_1.2,0.054978561401367185
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,16,1,power_law_1.2,0.11968192100524902
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,16,1,power_law_1.01,1.5880178833007812
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,16,1,power_law_1.2,0.12263168334960936
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,16,1,power_law_1.2,0.13110272407531737
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,16,1,power_law_1.2,0.1438758373260498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,16,1,power_law_1.01,1.963356170654297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,16,1,power_law_1.2,0.14523327827453614
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,16,1,power_law_1.2,0.15103167533874512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,16,1,power_law_1.2,0.15596608161926268
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,16,1,power_law_1.2,0.15896384239196776
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,16,1,power_law_1.2,0.16980480194091796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,16,1,power_law_1.2,0.18952896118164062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,16,1,power_law_1.2,0.2108780860900879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,16,1,power_law_1.2,0.2779520034790039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,16,1,power_law_1.2,0.3336191940307617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,16,1,power_law_1.2,0.4761171340942383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,16,1,power_law_1.2,0.5887155151367187
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,16,1,power_law_1.2,0.8249337768554688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,16,1,power_law_1.2,0.04267199993133545
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,16,1,power_law_1.2,0.048914561271667475
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,16,1,power_law_1.2,1.073278045654297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,16,1,power_law_1.2,0.056005120277404785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,16,1,power_law_1.2,0.06585984230041504
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,16,1,power_law_1.2,0.09633983612060547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,16,1,power_law_1.2,0.10182080268859864
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,16,1,power_law_1.2,0.10496512413024903
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,16,1,power_law_1.2,1.576907501220703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,16,1,power_law_1.2,0.10752511978149415
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,16,1,power_law_1.2,0.10834752082824708
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,16,1,power_law_1.2,0.11171520233154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,16,1,power_law_1.2,0.13576000213623046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,16,1,power_law_1.2,0.1368671989440918
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,16,1,power_law_1.2,2.085107879638672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,16,1,power_law_1.2,0.14396608352661133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,16,1,power_law_1.2,0.1521887969970703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,16,1,power_law_1.2,0.15941247940063477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,16,1,power_law_1.2,0.18006656646728517
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,16,1,power_law_1.2,0.19591487884521483
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,16,1,power_law_1.2,2.5835711669921873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,16,1,power_law_1.2,0.21565631866455076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,16,1,power_law_1.2,0.038215041160583496
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,16,1,power_law_1.2,0.25717056274414063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,16,1,power_law_1.2,0.2968204879760742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,16,1,power_law_1.2,0.4000780868530273
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,16,1,power_law_1.2,0.4815865707397461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,16,1,power_law_1.2,0.6636665344238282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,16,1,power_law_1.01,0.08770496368408202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,16,1,power_law_1.2,0.8463897705078125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,16,1,power_law_1.01,0.12213760375976564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,16,1,power_law_1.01,0.15138431549072268
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,16,1,power_law_1.2,1.2237760162353515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,16,1,power_law_1.01,0.08000063896179199
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,16,1,power_law_1.01,0.22561151504516602
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,16,1,power_law_1.2,1.5951948547363282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,16,1,power_law_1.01,0.24375680923461912
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,16,1,power_law_1.01,0.2572863960266113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,16,1,power_law_1.01,0.26716735839843747
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,16,1,power_law_1.01,0.2774784088134766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,16,1,power_law_1.01,0.09701120376586914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,16,1,power_law_1.01,0.311213436126709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,16,1,power_law_1.2,1.9736883544921873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,16,1,power_law_1.01,0.3413734436035156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,16,1,power_law_1.01,0.3237088012695312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,16,1,power_law_1.01,0.339749755859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,16,1,power_law_1.01,0.3555072021484375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,16,1,power_law_1.01,0.36741119384765625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,16,1,power_law_1.01,0.41696319580078123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,16,1,power_law_1.01,0.49137535095214846
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,16,1,power_law_1.01,0.5585472106933593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,16,1,power_law_1.01,0.6117625427246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,16,1,power_law_1.01,0.720983657836914
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,16,1,power_law_1.01,0.9532038116455078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,16,1,power_law_1.01,1.1894700622558594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,16,1,power_law_1.01,0.0630176019668579
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,16,1,power_law_1.01,1.6969938659667967
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,16,1,power_law_1.01,0.07398975849151611
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,16,1,power_law_1.01,0.09732288360595703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,16,1,power_law_1.01,2.1661389160156252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,16,1,power_law_1.01,0.1202566432952881
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,16,1,power_law_1.01,0.18550399780273436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,16,1,power_law_1.01,0.19566272735595702
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,16,1,power_law_1.01,0.20376703262329104
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,16,1,power_law_1.01,0.20942720413208007
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,16,1,power_law_1.01,3.1918911743164062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,16,1,power_law_1.01,0.2125657653808594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,16,1,power_law_1.01,0.05358272075653077
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,16,1,power_law_1.01,0.21904384613037112
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,16,1,power_law_1.01,0.22425344467163083
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,16,1,power_law_1.01,0.3014348793029785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,16,1,power_law_1.01,0.305096321105957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,16,1,power_law_1.01,0.3108211135864258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,16,1,power_law_1.01,0.3163091278076172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,16,1,power_law_1.01,4.161849670410156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,16,1,power_law_1.01,0.3300806427001953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,16,1,power_law_1.01,0.3636095809936523
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.01,0.3918368148803711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.01,0.48035839080810544
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.01,0.554733428955078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,16,1,power_law_1.01,5.138936767578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.01,0.7188025665283203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.01,0.8779859161376953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,16,1,power_law_1.2,0.08339008331298828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.01,1.2111634826660156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,16,1,power_law_1.2,0.09574848175048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.01,1.5395820617675782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,16,1,power_law_1.2,0.11579456329345703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,16,1,power_law_1.2,0.1388383960723877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,16,1,power_law_1.2,0.22194368362426758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,16,1,power_law_1.2,0.08010239601135254
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,16,1,power_law_1.2,0.2450822448730469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,16,1,power_law_1.2,0.2613747215270996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.01,2.2153637695312502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,16,1,power_law_1.2,0.27681856155395507
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,16,1,power_law_1.2,0.2919385528564453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,16,1,power_law_1.2,0.3380390548706055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,16,1,power_law_1.2,0.35546943664550784
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,16,1,power_law_1.2,0.3424147033691406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,16,1,power_law_1.2,0.3555801773071289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,16,1,power_law_1.2,0.379510383605957
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.01,2.8633843994140626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,16,1,power_law_1.2,0.396440315246582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,16,1,power_law_1.2,0.4324639892578125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,16,1,power_law_1.2,0.5254841613769531
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,16,1,power_law_1.2,0.5602137756347656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.01,3.5288903808593752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,16,1,power_law_1.2,0.6309049606323243
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,16,1,power_law_1.2,0.7352486419677734
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,16,1,power_law_1.2,0.9672070312500001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,16,1,power_law_1.2,1.2120543670654296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,16,1,power_law_1.2,0.060698242187499994
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,16,1,power_law_1.2,0.07288512229919433
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,16,1,power_law_1.2,1.7086802673339843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,16,1,power_law_1.2,0.0915724754333496
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,16,1,power_law_1.2,0.11088255882263183
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,16,1,power_law_1.2,2.213274230957031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,16,1,power_law_1.2,0.18435775756835937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,16,1,power_law_1.2,0.19553600311279298
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,16,1,power_law_1.2,0.2066726493835449
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,16,1,power_law_1.2,0.21213632583618164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,16,1,power_law_1.2,0.21758848190307617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,16,1,power_law_1.2,0.22099136352539062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,16,1,power_law_1.2,3.1885882568359376
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,16,1,power_law_1.2,0.05412223815917969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,16,1,power_law_1.2,0.2298355293273926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,16,1,power_law_1.2,0.3071564865112305
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,16,1,power_law_1.2,0.31267776489257815
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,16,1,power_law_1.2,0.3186297607421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,16,1,power_law_1.2,0.32667198181152346
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,16,1,power_law_1.2,0.33941184997558593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,16,1,power_law_1.2,0.36781375885009765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,16,1,power_law_1.2,4.183402099609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,16,1,power_law_1.2,0.40154689788818365
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,16,1,power_law_1.2,0.49461822509765624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,16,1,power_law_1.2,0.5576691055297852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,16,1,power_law_1.2,5.147945556640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,16,1,power_law_1.2,0.7330316925048829
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,16,1,power_law_1.2,0.8822509002685546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,16,1,power_law_1.2,1.2215392303466797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,16,1,power_law_1.2,1.552849884033203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,16,1,power_law_1.01,0.11705727577209472
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,16,1,power_law_1.01,0.12590527534484863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,16,1,power_law_1.01,0.13888768196105955
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,16,1,power_law_1.2,2.220819854736328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,16,1,power_law_1.01,0.14836480140686034
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,16,1,power_law_1.01,0.2107200050354004
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,16,1,power_law_1.01,0.2764908790588379
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,16,1,power_law_1.01,0.3120607948303223
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,16,1,power_law_1.2,2.8938259887695312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,16,1,power_law_1.01,0.4578911972045899
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,16,1,power_law_1.01,0.46635520935058594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,16,1,power_law_1.01,0.47652416229248046
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,16,1,power_law_1.01,0.4863590240478516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,16,1,power_law_1.01,0.4986316680908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,16,1,power_law_1.2,3.532140197753906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,16,1,power_law_1.01,0.5071161651611329
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,16,1,power_law_1.01,0.52229248046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,16,1,power_law_1.01,0.5461536026000976
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,16,1,power_law_1.01,0.5720166397094727
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,16,1,power_law_1.01,0.7603654479980468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,16,1,power_law_1.01,0.8086930847167968
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,16,1,power_law_1.01,0.8538374328613282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,16,1,power_law_1.01,0.9542540740966796
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,16,1,power_law_1.01,1.0832364654541016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,16,1,power_law_1.01,1.329698486328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,16,1,power_law_1.01,1.5879840087890624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,16,1,power_law_1.01,0.07545728206634521
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,16,1,power_law_1.01,0.08669376373291016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,16,1,power_law_1.01,2.0890515136718752
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,16,1,power_law_1.01,0.10349568367004394
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,16,1,power_law_1.01,0.11205375671386719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,16,1,power_law_1.01,2.5833837890624998
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,16,1,power_law_1.01,0.16980672836303712
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,16,1,power_law_1.01,0.23516544342041015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,16,1,power_law_1.01,0.2588319969177246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,16,1,power_law_1.01,3.528176574707031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,16,1,power_law_1.01,0.3123788833618164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,16,1,power_law_1.01,0.3305260848999024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,16,1,power_law_1.01,0.34304256439208985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,16,1,power_law_1.01,0.3641715240478516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,16,1,power_law_1.01,0.3748665618896484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,16,1,power_law_1.01,4.521795959472657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,16,1,power_law_1.01,0.3883116912841797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,16,1,power_law_1.01,0.40319679260253904
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,16,1,power_law_1.01,0.4161478424072266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,16,1,power_law_1.01,0.4222393417358399
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,16,1,power_law_1.01,0.5385465621948242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,16,1,power_law_1.01,0.5704294586181641
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,16,1,power_law_1.01,5.573698120117188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.01,0.6059142303466797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.01,0.6765555572509766
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.01,0.7566201782226563
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.01,0.9163641357421876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.01,1.0575846099853516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,16,1,power_law_1.2,0.11666048049926758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,16,1,power_law_1.2,0.12596735954284669
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.01,1.379694061279297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,16,1,power_law_1.2,0.132609281539917
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.01,1.6954757690429687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,16,1,power_law_1.2,0.14879039764404295
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,16,1,power_law_1.2,0.19391487121582032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.01,2.351848907470703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,16,1,power_law_1.2,0.2498758316040039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,16,1,power_law_1.2,0.28820928573608395
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,16,1,power_law_1.2,0.44864383697509763
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,16,1,power_law_1.2,0.45890239715576175
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.01,2.9973907470703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,16,1,power_law_1.2,0.46908416748046877
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,16,1,power_law_1.2,0.4826252746582031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,16,1,power_law_1.2,0.4942739105224609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,16,1,power_law_1.2,0.500195198059082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,16,1,power_law_1.2,0.5182144165039062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.01,3.7112960815429688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,16,1,power_law_1.2,0.5478656005859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,16,1,power_law_1.2,0.5862521743774414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,16,1,power_law_1.2,0.764755859375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,16,1,power_law_1.2,0.816343002319336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,16,1,power_law_1.2,0.8740895843505859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,16,1,power_law_1.2,0.9928729248046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,16,1,power_law_1.2,1.1293113708496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,16,1,power_law_1.2,1.3637606811523437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,16,1,power_law_1.2,1.6503736877441404
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,16,1,power_law_1.2,0.07509312152862549
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,16,1,power_law_1.2,0.08666687965393066
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,16,1,power_law_1.2,2.114038391113281
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,16,1,power_law_1.2,0.09553407669067383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,16,1,power_law_1.2,2.600782165527344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,16,1,power_law_1.2,0.11268287658691407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,16,1,power_law_1.2,0.15285568237304686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,16,1,power_law_1.2,0.19997440338134767
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,16,1,power_law_1.2,0.24308544158935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,16,1,power_law_1.2,0.30082496643066403
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,16,1,power_law_1.2,0.31892351150512693
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,16,1,power_law_1.2,3.5761260986328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,16,1,power_law_1.2,0.3305344009399414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,16,1,power_law_1.2,0.3508620834350586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,16,1,power_law_1.2,0.367710075378418
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,16,1,power_law_1.2,0.37880897521972656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,16,1,power_law_1.2,0.3959328079223633
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,16,1,power_law_1.2,0.41247806549072263
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,16,1,power_law_1.2,4.605513610839844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,16,1,power_law_1.2,0.4251859283447265
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,16,1,power_law_1.2,0.5405311965942383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,16,1,power_law_1.2,0.5821049499511719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,16,1,power_law_1.2,5.636915283203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,16,1,power_law_1.2,0.6219641494750976
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,16,1,power_law_1.2,0.7085747528076172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,16,1,power_law_1.2,0.8064755249023439
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,32,1,power_law_1.01,0.04291520118713379
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,16,1,power_law_1.2,0.9588365173339843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,32,1,power_law_1.01,0.045980157852172854
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,16,1,power_law_1.2,1.1346080017089843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,32,1,power_law_1.01,0.0479750394821167
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,32,1,power_law_1.01,0.05427711963653564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,32,1,power_law_1.01,0.08019071578979492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,32,1,power_law_1.01,0.08162943840026855
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,32,1,power_law_1.01,0.08293951988220215
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,32,1,power_law_1.01,0.08401280403137207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,16,1,power_law_1.2,1.4552928161621093
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,32,1,power_law_1.01,0.08471232414245605
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,32,1,power_law_1.01,0.08594367980957032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,32,1,power_law_1.01,0.08919872283935547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,32,1,power_law_1.01,0.09027968406677246
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,32,1,power_law_1.01,0.0938047981262207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,32,1,power_law_1.01,0.09669376373291015
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,16,1,power_law_1.2,1.7773561096191408
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,32,1,power_law_1.01,0.09996671676635742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,32,1,power_law_1.01,0.1057260799407959
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,32,1,power_law_1.01,0.10797504425048828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,32,1,power_law_1.01,0.12211520195007323
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,32,1,power_law_1.01,0.1370963191986084
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,32,1,power_law_1.01,0.18261247634887695
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,32,1,power_law_1.01,0.2338060760498047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,32,1,power_law_1.01,0.34334014892578124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,32,1,power_law_1.01,0.4193868637084961
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,16,1,power_law_1.2,2.4185087585449216
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,32,1,power_law_1.01,0.599478416442871
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,32,1,power_law_1.01,0.78242431640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,16,1,power_law_1.2,3.0908978271484377
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,32,1,power_law_1.01,1.1438771057128907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,32,1,power_law_1.01,0.036018559932708735
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,32,1,power_law_1.01,0.05101376056671143
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,32,1,power_law_1.01,0.05136256217956543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,32,1,power_law_1.01,1.5112896728515626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,16,1,power_law_1.2,3.7337869262695316
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,32,1,power_law_1.01,0.05250688076019287
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,32,1,power_law_1.01,0.053498878479003906
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,32,1,power_law_1.01,0.05457151889801025
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,32,1,power_law_1.01,0.05589888095855713
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,32,1,power_law_1.01,0.05600255966186524
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,32,1,power_law_1.01,1.8864250183105469
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,32,1,power_law_1.01,0.05796671867370605
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,32,1,power_law_1.01,0.061432318687438967
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,32,1,power_law_1.01,0.06651968002319336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,32,1,power_law_1.01,0.06932735919952393
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,32,1,power_law_1.01,0.07262015819549561
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,32,1,power_law_1.01,0.06959104061126709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,32,1,power_law_1.01,0.07924672126770019
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.01,0.08617983818054199
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.01,0.10317248344421386
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.01,0.14356032371520996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.01,0.18234943389892577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.01,0.2413075256347656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.01,0.33142078399658204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,32,1,power_law_1.01,0.03028223991394043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.01,0.405665283203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,14336,2,8,32,1,power_law_1.2,0.04276095867156983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,14336,2,8,32,1,power_law_1.2,0.04520063877105713
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,32,1,power_law_1.01,0.036224639415740965
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.01,0.5842099380493164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,14336,2,8,32,1,power_law_1.2,0.047388801574707026
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,14336,2,8,32,1,power_law_1.2,0.07936511993408203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,14336,2,8,32,1,power_law_1.2,0.08173760414123535
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,14336,2,8,32,1,power_law_1.2,0.08262656211853028
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.01,0.77238525390625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,14336,2,8,32,1,power_law_1.2,0.08431679725646972
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,32,1,power_law_1.01,0.037234559059143066
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,14336,2,8,32,1,power_law_1.2,0.08504575729370117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,14336,2,8,32,1,power_law_1.2,0.08607487678527832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,14336,2,8,32,1,power_law_1.2,0.0888486385345459
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.01,0.9579065704345704
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,14336,2,8,32,1,power_law_1.2,0.09078399658203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,14336,2,8,32,1,power_law_1.2,0.09298879623413085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,14336,2,8,32,1,power_law_1.2,0.09643712043762206
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,14336,2,8,32,1,power_law_1.2,0.10007871627807616
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,14336,2,8,32,1,power_law_1.2,0.10627072334289552
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,14336,2,8,32,1,power_law_1.2,0.10793343544006348
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,14336,2,8,32,1,power_law_1.2,0.12116415977478028
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,14336,2,8,32,1,power_law_1.2,0.13789183616638184
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,14336,2,8,32,1,power_law_1.2,0.18163391113281252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,14336,2,8,32,1,power_law_1.2,0.23469568252563477
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,14336,2,8,32,1,power_law_1.2,0.053750400543212895
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,14336,2,8,32,1,power_law_1.2,0.34326145172119144
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,14336,2,8,32,1,power_law_1.2,0.4173606491088867
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,14336,2,8,32,1,power_law_1.2,0.03539391994476319
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,14336,2,8,32,1,power_law_1.2,0.03660864114761352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,14336,2,8,32,1,power_law_1.2,0.5999411010742188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,14336,2,8,32,1,power_law_1.2,0.03623296022415161
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,14336,2,8,32,1,power_law_1.2,0.7818803405761718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,14336,2,8,32,1,power_law_1.2,0.05060991764068603
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,14336,2,8,32,1,power_law_1.2,0.05167679786682129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,14336,2,8,32,1,power_law_1.2,0.05217599868774414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,14336,2,8,32,1,power_law_1.2,0.05407680034637451
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,14336,2,8,32,1,power_law_1.2,0.053417601585388184
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,14336,2,8,32,1,power_law_1.2,0.055015039443969724
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,14336,2,8,32,1,power_law_1.2,1.1419718170166016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,14336,2,8,32,1,power_law_1.2,0.05598464012145996
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,14336,2,8,32,1,power_law_1.2,0.058221440315246585
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,14336,2,8,32,1,power_law_1.2,0.06226111888885498
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,14336,2,8,32,1,power_law_1.2,0.06623807907104493
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,14336,2,8,32,1,power_law_1.2,0.06933311939239502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,14336,2,8,32,1,power_law_1.2,0.07116608142852783
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,14336,2,8,32,1,power_law_1.2,0.06952576160430908
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,14336,2,8,32,1,power_law_1.2,1.5092262268066405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,14336,2,8,32,1,power_law_1.2,0.07885503768920898
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,14336,2,8,32,1,power_law_1.2,0.08551296234130859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,14336,2,8,32,1,power_law_1.2,0.10289664268493652
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,14336,2,8,32,1,power_law_1.2,0.14404095649719237
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,14336,2,8,32,1,power_law_1.2,0.18190208435058594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,14336,2,8,32,1,power_law_1.2,1.8723231506347655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,14336,2,8,32,1,power_law_1.2,0.23937536239624024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,14336,2,8,32,1,power_law_1.2,0.3326630401611328
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,14336,2,8,32,1,power_law_1.2,0.41088703155517575
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,32,1,power_law_1.01,0.0559980821609497
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,32,1,power_law_1.01,0.0621779203414917
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,32,1,power_law_1.01,0.06357952117919921
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,14336,2,8,32,1,power_law_1.2,0.5864716720581055
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,32,1,power_law_1.01,0.07364352226257324
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,32,1,power_law_1.01,0.11315391540527345
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,14336,2,8,32,1,power_law_1.2,0.030429439544677733
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,32,1,power_law_1.01,0.11424256324768067
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,14336,2,8,32,1,power_law_1.2,0.7697644805908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,32,1,power_law_1.01,0.11788991928100585
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,32,1,power_law_1.01,0.11821824073791505
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,32,1,power_law_1.01,0.11931967735290527
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,32,1,power_law_1.01,0.12424575805664062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,32,1,power_law_1.01,0.12117952346801757
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,14336,2,8,32,1,power_law_1.2,0.9544377899169921
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,32,1,power_law_1.01,0.12657919883728028
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,32,1,power_law_1.01,0.132294397354126
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,32,1,power_law_1.01,0.13973376274108887
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,32,1,power_law_1.01,0.14414079666137697
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,32,1,power_law_1.01,0.1478623962402344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,32,1,power_law_1.01,0.1525011157989502
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,32,1,power_law_1.01,0.17380287170410155
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,32,1,power_law_1.01,0.1960492706298828
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,32,1,power_law_1.01,0.28040447235107424
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,32,1,power_law_1.01,0.36458881378173824
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,32,1,power_law_1.01,0.5096473693847656
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,32,1,power_law_1.01,0.6666214752197266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,32,1,power_law_1.01,0.04307583808898926
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,32,1,power_law_1.01,0.04362815856933594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,32,1,power_law_1.01,0.9719859313964843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,32,1,power_law_1.01,0.053994879722595215
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,32,1,power_law_1.01,0.06684415817260743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,32,1,power_law_1.01,1.2731584167480468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,32,1,power_law_1.01,0.0694816017150879
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,32,1,power_law_1.01,0.06835904121398925
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,32,1,power_law_1.01,0.06968448162078858
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,32,1,power_law_1.01,0.07162496089935302
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,32,1,power_law_1.01,0.07167871952056884
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,32,1,power_law_1.01,0.07283455848693847
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,32,1,power_law_1.01,0.0743769598007202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,32,1,power_law_1.01,0.07635519981384278
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,32,1,power_law_1.01,0.07873600006103516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,32,1,power_law_1.01,1.8912319946289062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,32,1,power_law_1.01,0.0814470386505127
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,32,1,power_law_1.01,0.08545344352722169
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,32,1,power_law_1.01,0.08783679962158203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,32,1,power_law_1.01,0.10105024337768556
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.01,0.11120767593383789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.01,0.1387839984893799
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.01,0.19330047607421874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.01,0.24423871994018556
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,32,1,power_law_1.01,2.503095703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.01,0.32669631958007816
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.01,0.4556569671630859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,16384,2,8,32,1,power_law_1.2,0.05615295886993408
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.01,0.5578566360473632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,16384,2,8,32,1,power_law_1.2,0.06094399929046631
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,16384,2,8,32,1,power_law_1.2,0.06337279796600341
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,32,1,power_law_1.01,0.04001088142395019
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,16384,2,8,32,1,power_law_1.2,0.07359488010406494
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,32,1,power_law_1.01,3.1118151855468748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.01,0.8085868835449219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,16384,2,8,32,1,power_law_1.2,0.11201984405517577
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,16384,2,8,32,1,power_law_1.2,0.11481727600097655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,16384,2,8,32,1,power_law_1.2,0.11662015914916993
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,16384,2,8,32,1,power_law_1.2,0.11766847610473632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,16384,2,8,32,1,power_law_1.2,0.12093824386596679
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,16384,2,8,32,1,power_law_1.2,0.12213567733764648
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,16384,2,8,32,1,power_law_1.2,0.12456447601318359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.01,1.074339828491211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,16384,2,8,32,1,power_law_1.2,0.12695487976074218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,16384,2,8,32,1,power_law_1.2,0.13009407997131348
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,16384,2,8,32,1,power_law_1.2,0.13988287925720216
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,16384,2,8,32,1,power_law_1.2,0.14449536323547363
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,16384,2,8,32,1,power_law_1.2,0.14883647918701173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,16384,2,8,32,1,power_law_1.2,0.15216575622558595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,16384,2,8,32,1,power_law_1.2,0.17330879211425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.01,1.338146514892578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,16384,2,8,32,1,power_law_1.2,0.1977343940734863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,16384,2,8,32,1,power_law_1.2,0.2814739227294922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,16384,2,8,32,1,power_law_1.2,0.379315185546875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,16384,2,8,32,1,power_law_1.2,0.5103385543823242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,16384,2,8,32,1,power_law_1.2,0.03969343900680542
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,16384,2,8,32,1,power_law_1.2,0.6676351928710937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,16384,2,8,32,1,power_law_1.2,0.043877120018005374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,16384,2,8,32,1,power_law_1.2,0.0535148811340332
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,16384,2,8,32,1,power_law_1.2,0.9653036499023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,16384,2,8,32,1,power_law_1.2,0.06719488143920899
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,16384,2,8,32,1,power_law_1.2,0.06837056159973146
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,16384,2,8,32,1,power_law_1.2,0.06953919887542724
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,16384,2,8,32,1,power_law_1.2,0.06989952087402343
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,16384,2,8,32,1,power_law_1.2,1.2727449798583985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,16384,2,8,32,1,power_law_1.2,0.07091392040252685
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,16384,2,8,32,1,power_law_1.2,0.07107135772705078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,16384,2,8,32,1,power_law_1.2,0.07277567863464356
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,16384,2,8,32,1,power_law_1.2,0.07538879871368408
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,16384,2,8,32,1,power_law_1.2,0.07613759994506836
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,16384,2,8,32,1,power_law_1.2,0.07901440143585206
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,16384,2,8,32,1,power_law_1.2,0.08132160186767579
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,16384,2,8,32,1,power_law_1.2,0.08703167915344238
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,16384,2,8,32,1,power_law_1.2,1.8839967346191409
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,16384,2,8,32,1,power_law_1.2,0.0874233627319336
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,16384,2,8,32,1,power_law_1.2,0.10025792121887207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,16384,2,8,32,1,power_law_1.2,0.10880895614624024
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,16384,2,8,32,1,power_law_1.2,0.13898048400878907
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,16384,2,8,32,1,power_law_1.2,0.1956768035888672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,16384,2,8,32,1,power_law_1.2,0.24392000198364258
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,16384,2,8,32,1,power_law_1.2,2.5001478576660157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,16384,2,8,32,1,power_law_1.2,0.3240358352661133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,16384,2,8,32,1,power_law_1.2,0.4564543914794922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,16384,2,8,32,1,power_law_1.2,0.5719462585449219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,16384,2,8,32,1,power_law_1.2,3.119928894042969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,16384,2,8,32,1,power_law_1.2,0.04212672233581543
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,16384,2,8,32,1,power_law_1.2,0.8231308746337891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,32,1,power_law_1.01,0.0721459197998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,16384,2,8,32,1,power_law_1.2,1.0716883087158204
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,32,1,power_law_1.01,0.0962816047668457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,32,1,power_law_1.01,0.1003769588470459
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,32,1,power_law_1.01,0.1154361629486084
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,16384,2,8,32,1,power_law_1.2,1.3446733093261718
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,32,1,power_law_1.01,0.13683456420898438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,32,1,power_law_1.01,0.16046911239624023
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,32,1,power_law_1.01,0.19976383209228515
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,32,1,power_law_1.01,0.2045017623901367
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,32,1,power_law_1.01,0.21156799316406252
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,32,1,power_law_1.01,0.2151468849182129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,32,1,power_law_1.01,0.23146047592163085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,32,1,power_law_1.01,0.24225280761718748
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,32,1,power_law_1.01,0.26107072830200195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,32,1,power_law_1.01,0.28641408920288086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,32,1,power_law_1.01,0.27526336669921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,32,1,power_law_1.01,0.2801190376281738
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,32,1,power_law_1.01,0.29586944580078123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,32,1,power_law_1.01,0.3239603042602539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,32,1,power_law_1.01,0.3535776138305664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,32,1,power_law_1.01,0.4219078445434571
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,32,1,power_law_1.01,0.5099148941040039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,32,1,power_law_1.01,0.715687026977539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,32,1,power_law_1.01,0.851918716430664
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,32,1,power_law_1.01,0.05985856056213379
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,32,1,power_law_1.01,1.1994509124755859
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,32,1,power_law_1.01,0.06594175815582275
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,32,1,power_law_1.01,0.07467135906219483
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,32,1,power_law_1.01,0.09638976097106934
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,32,1,power_law_1.01,1.5595283508300781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,32,1,power_law_1.01,0.12393407821655274
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,32,1,power_law_1.01,0.15049471855163574
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,32,1,power_law_1.01,0.1980985641479492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,32,1,power_law_1.01,0.20616512298583983
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,32,1,power_law_1.01,2.2619660949707034
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,32,1,power_law_1.01,0.2129952049255371
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,32,1,power_law_1.01,0.2183238410949707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,32,1,power_law_1.01,0.22763071060180665
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,32,1,power_law_1.01,0.23618431091308595
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,32,1,power_law_1.01,0.24267648696899413
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,32,1,power_law_1.01,2.9551123046875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,32,1,power_law_1.01,0.2532371139526367
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,32,1,power_law_1.01,0.3421440124511719
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,32,1,power_law_1.01,0.34962112426757813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,32,1,power_law_1.01,0.36128318786621094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,32,1,power_law_1.01,3.6334469604492186
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,32,1,power_law_1.01,0.38954177856445316
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,32,1,power_law_1.01,0.4210041427612305
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,32,1,power_law_1.01,0.515689582824707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,32,1,power_law_1.01,0.5787519836425782
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,32,1,power_law_1.01,0.7114892578124999
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,32,1,power_law_1.01,0.8769785308837891
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,256,32,1,power_law_1.2,0.07154496192932129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,32,1,power_law_1.01,1.1611891174316407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,256,32,1,power_law_1.2,0.09678208351135253
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,256,32,1,power_law_1.2,0.09999679565429688
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,256,32,1,power_law_1.2,0.11344639778137207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,32,1,power_law_1.01,1.4660704040527344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,256,32,1,power_law_1.2,0.1297152042388916
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,256,32,1,power_law_1.2,0.15115903854370116
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,256,32,1,power_law_1.2,0.1930406379699707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,32,1,power_law_1.01,2.0675570678710935
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,256,32,1,power_law_1.2,0.20264703750610352
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,256,32,1,power_law_1.2,0.20827455520629884
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,256,32,1,power_law_1.2,0.21583168029785157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,256,32,1,power_law_1.2,0.23244991302490234
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,256,32,1,power_law_1.2,0.24384895324707032
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,32,1,power_law_1.01,2.6490164184570313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,256,32,1,power_law_1.2,0.2607500839233398
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,256,32,1,power_law_1.2,0.2795071983337402
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,256,32,1,power_law_1.2,0.2908012771606445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,256,32,1,power_law_1.2,0.287956485748291
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,256,32,1,power_law_1.2,0.302677116394043
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,32,1,power_law_1.01,3.235509033203125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,256,32,1,power_law_1.2,0.3377459335327148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,256,32,1,power_law_1.2,0.3668511962890625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,256,32,1,power_law_1.2,0.4420000076293945
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,256,32,1,power_law_1.2,0.5280857467651368
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,256,32,1,power_law_1.2,0.7326233673095703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,256,32,1,power_law_1.2,0.870606689453125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,256,32,1,power_law_1.2,0.06059904098510742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,256,32,1,power_law_1.2,0.06586368083953857
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,256,32,1,power_law_1.2,1.2156403350830078
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,256,32,1,power_law_1.2,0.0727020788192749
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,256,32,1,power_law_1.2,1.5785331726074219
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,256,32,1,power_law_1.2,0.09286272048950195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,256,32,1,power_law_1.2,0.11535679817199707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,256,32,1,power_law_1.2,0.1400870418548584
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,256,32,1,power_law_1.2,2.284357147216797
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,256,32,1,power_law_1.2,0.1927903938293457
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,256,32,1,power_law_1.2,0.20314752578735354
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,256,32,1,power_law_1.2,0.21073087692260742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,256,32,1,power_law_1.2,0.2165760040283203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,256,32,1,power_law_1.2,2.9783416748046876
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,256,32,1,power_law_1.2,0.22695871353149416
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,256,32,1,power_law_1.2,0.23652992248535157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,256,32,1,power_law_1.2,0.24528896331787112
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,256,32,1,power_law_1.2,0.25844608306884764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,256,32,1,power_law_1.2,0.3492665481567383
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,256,32,1,power_law_1.2,0.35694271087646484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,256,32,1,power_law_1.2,3.663223571777344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,256,32,1,power_law_1.2,0.37127681732177736
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,256,32,1,power_law_1.2,0.41604545593261716
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,256,32,1,power_law_1.2,0.4728281784057617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,256,32,1,power_law_1.2,0.539351692199707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,256,32,1,power_law_1.2,0.6010873413085938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,256,32,1,power_law_1.2,0.7413497924804687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,32,1,power_law_1.01,0.03905087947845459
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,256,32,1,power_law_1.2,0.8991532897949218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,32,1,power_law_1.01,0.052308478355407716
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,32,1,power_law_1.01,0.05797056198120117
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,32,1,power_law_1.01,0.06334015846252442
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,256,32,1,power_law_1.2,1.1867072296142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,32,1,power_law_1.01,0.06946112155914307
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,32,1,power_law_1.01,0.08518272399902344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,256,32,1,power_law_1.2,1.4928787231445313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,32,1,power_law_1.01,0.09049920082092286
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,32,1,power_law_1.01,0.09323967933654785
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,32,1,power_law_1.01,0.0963871955871582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,32,1,power_law_1.01,0.09916735649108886
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,32,1,power_law_1.01,0.10570752143859863
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,256,32,1,power_law_1.2,2.0856288146972655
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,256,32,1,power_law_1.2,2.6812319946289063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,32,1,power_law_1.01,0.11934720039367677
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,32,1,power_law_1.01,0.12148032188415528
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,256,32,1,power_law_1.2,3.276078186035156
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,32,1,power_law_1.01,0.1299884796142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,32,1,power_law_1.01,0.12622079849243165
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,32,1,power_law_1.01,0.1339590358734131
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,32,1,power_law_1.01,0.14280639648437501
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,32,1,power_law_1.01,0.17978303909301757
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,32,1,power_law_1.01,0.21791872024536132
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,32,1,power_law_1.01,0.3691769790649414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,32,1,power_law_1.01,0.4913747024536133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,32,1,power_law_1.01,0.15984127998352052
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,32,1,power_law_1.01,0.6839424133300781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,32,1,power_law_1.01,0.03827327966690063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,32,1,power_law_1.01,0.03998208045959473
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,32,1,power_law_1.01,0.8767788696289063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,32,1,power_law_1.01,0.048624000549316405
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,32,1,power_law_1.01,0.056550397872924804
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,32,1,power_law_1.01,0.06483391761779786
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,32,1,power_law_1.01,0.2584569549560547
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,32,1,power_law_1.01,0.08541440010070801
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,32,1,power_law_1.01,1.3014425659179687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,32,1,power_law_1.01,0.09171520233154297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,32,1,power_law_1.01,0.09464639663696289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,32,1,power_law_1.01,0.09603263854980468
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,32,1,power_law_1.01,0.09720383644104004
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,32,1,power_law_1.01,0.10106623649597168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,32,1,power_law_1.01,1.7298162841796874
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,32,1,power_law_1.01,0.1258502388000488
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,32,1,power_law_1.01,0.12856255531311037
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,32,1,power_law_1.01,0.13489343643188476
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,32,1,power_law_1.01,0.13634623527526854
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,32,1,power_law_1.01,0.14312319755554198
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,32,1,power_law_1.01,0.15929344177246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,32,1,power_law_1.01,0.18945791244506835
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,32,1,power_law_1.01,0.2100499153137207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,32,1,power_law_1.01,2.1511654663085937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,32,1,power_law_1.01,0.24986560821533202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,32,1,power_law_1.01,0.2942201614379883
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,32,1,power_law_1.01,0.39424575805664064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,32,1,power_law_1.01,0.4754905700683594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,32,1,power_law_1.01,0.6603103637695312
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,4096,1536,8,128,32,1,power_law_1.2,0.0532863998413086
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,32,1,power_law_1.01,0.850042266845703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,4096,1536,8,128,32,1,power_law_1.2,0.05698495864868164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,4096,1536,8,128,32,1,power_law_1.2,0.06188352108001709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,4096,1536,8,128,32,1,power_law_1.2,0.06805568218231202
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,32,1,power_law_1.01,1.2224691009521484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,4096,1536,8,128,32,1,power_law_1.2,0.0855020809173584
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,4096,1536,8,128,32,1,power_law_1.2,0.0903756809234619
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,4096,1536,8,128,32,1,power_law_1.2,0.09372415542602539
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,4096,1536,8,128,32,1,power_law_1.2,0.09740032196044922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,4096,1536,8,128,32,1,power_law_1.2,0.03959167957305908
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,4096,1536,8,128,32,1,power_law_1.2,0.10047807693481445
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,4096,1536,8,128,32,1,power_law_1.2,0.10676416397094726
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,32,1,power_law_1.01,1.592681579589844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,4096,1536,8,128,32,1,power_law_1.2,0.12026240348815917
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,4096,1536,8,128,32,1,power_law_1.2,0.12291647911071776
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,4096,1536,8,128,32,1,power_law_1.2,0.1280838394165039
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,4096,1536,8,128,32,1,power_law_1.2,0.13156607627868652
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,32,1,power_law_1.01,1.9631552124023437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,4096,1536,8,128,32,1,power_law_1.2,0.13563199996948244
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,4096,1536,8,128,32,1,power_law_1.2,0.14426624298095703
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,4096,1536,8,128,32,1,power_law_1.2,0.16106943130493162
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,4096,1536,8,128,32,1,power_law_1.2,0.18035200119018555
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,4096,1536,8,128,32,1,power_law_1.2,0.21938560485839842
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,4096,1536,8,128,32,1,power_law_1.2,0.26004032135009764
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,4096,1536,8,128,32,1,power_law_1.2,0.36700416564941407
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,4096,1536,8,128,32,1,power_law_1.2,0.5000172805786133
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,4096,1536,8,128,32,1,power_law_1.2,0.6899078369140625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,4096,1536,8,128,32,1,power_law_1.2,0.03805311918258667
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,4096,1536,8,128,32,1,power_law_1.2,0.04000192165374756
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,4096,1536,8,128,32,1,power_law_1.2,0.8873446655273437
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,4096,1536,8,128,32,1,power_law_1.2,0.047516798973083495
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,4096,1536,8,128,32,1,power_law_1.2,0.054535679817199714
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,4096,1536,8,128,32,1,power_law_1.2,0.061505279541015624
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,4096,1536,8,128,32,1,power_law_1.2,0.08834752082824707
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,4096,1536,8,128,32,1,power_law_1.2,1.3160986328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,4096,1536,8,128,32,1,power_law_1.2,0.09266688346862792
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,4096,1536,8,128,32,1,power_law_1.2,0.09524543762207031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,4096,1536,8,128,32,1,power_law_1.2,0.09805055618286132
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,4096,1536,8,128,32,1,power_law_1.2,0.09831808090209962
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,4096,1536,8,128,32,1,power_law_1.2,0.10165184020996094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,4096,1536,8,128,32,1,power_law_1.2,1.7408511352539062
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,4096,1536,8,128,32,1,power_law_1.2,0.12777728080749512
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,4096,1536,8,128,32,1,power_law_1.2,0.13117119789123535
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,4096,1536,8,128,32,1,power_law_1.2,0.1366412830352783
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,4096,1536,8,128,32,1,power_law_1.2,0.1437983989715576
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,4096,1536,8,128,32,1,power_law_1.2,0.1517024040222168
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,4096,1536,8,128,32,1,power_law_1.2,0.17274816513061525
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,4096,1536,8,128,32,1,power_law_1.2,0.19080127716064452
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,4096,1536,8,128,32,1,power_law_1.2,0.21254400253295896
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,4096,1536,8,128,32,1,power_law_1.2,2.171656951904297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,4096,1536,8,128,32,1,power_law_1.2,0.256495361328125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,4096,1536,8,128,32,1,power_law_1.2,0.2969311904907227
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,4096,1536,8,128,32,1,power_law_1.2,0.39884479522705074
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,4096,1536,8,128,32,1,power_law_1.2,0.48311809539794925
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,4096,1536,8,128,32,1,power_law_1.2,0.6644416046142578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,32,1,power_law_1.01,0.08134719848632813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,32,1,power_law_1.01,0.08843839645385743
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,4096,1536,8,128,32,1,power_law_1.2,0.8498528289794922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,32,1,power_law_1.01,0.10265664100646972
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,32,1,power_law_1.01,0.11677760124206542
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,4096,1536,8,128,32,1,power_law_1.2,1.2216742706298827
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,32,1,power_law_1.01,0.1548960018157959
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,32,1,power_law_1.01,0.1624723243713379
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,32,1,power_law_1.01,0.058329601287841794
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,32,1,power_law_1.01,0.16983999252319334
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,32,1,power_law_1.01,0.1776576042175293
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,4096,1536,8,128,32,1,power_law_1.2,1.6048095703125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,32,1,power_law_1.01,0.18273216247558594
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,32,1,power_law_1.01,0.19685312271118166
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,32,1,power_law_1.01,0.20774400711059568
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,32,1,power_law_1.01,0.2155583953857422
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,4096,1536,8,128,32,1,power_law_1.2,1.9771128845214843
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,32,1,power_law_1.01,0.22044031143188478
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,32,1,power_law_1.01,0.22789440155029297
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,32,1,power_law_1.01,0.2349100875854492
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,32,1,power_law_1.01,0.2507072067260742
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,32,1,power_law_1.01,0.2831705665588379
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,32,1,power_law_1.01,0.31828927993774414
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,32,1,power_law_1.01,0.4076927947998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,32,1,power_law_1.01,0.5319692611694335
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,32,1,power_law_1.01,0.7046297454833985
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,32,1,power_law_1.01,0.8731827545166017
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,32,1,power_law_1.01,0.053137922286987306
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,32,1,power_law_1.01,0.06127615928649902
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,32,1,power_law_1.01,1.2498086547851561
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,32,1,power_law_1.01,0.06780928134918213
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,32,1,power_law_1.01,0.08744959831237793
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,32,1,power_law_1.01,0.1050547218322754
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,32,1,power_law_1.01,1.647370300292969
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,32,1,power_law_1.01,0.14131903648376465
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,32,1,power_law_1.01,0.15160256385803222
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,32,1,power_law_1.01,0.16683839797973632
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,32,1,power_law_1.01,0.17515840530395507
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,32,1,power_law_1.01,0.17925312042236327
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,32,1,power_law_1.01,0.18657215118408205
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,32,1,power_law_1.01,0.19339839935302733
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,32,1,power_law_1.01,2.382414093017578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,32,1,power_law_1.01,0.24122495651245118
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,32,1,power_law_1.01,0.2459334373474121
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,32,1,power_law_1.01,0.2536096000671387
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,32,1,power_law_1.01,0.25757183074951173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,32,1,power_law_1.01,0.2714630317687988
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,32,1,power_law_1.01,0.3036396789550781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,32,1,power_law_1.01,3.143535461425781
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,32,1,power_law_1.01,0.33065086364746094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,32,1,power_law_1.01,0.38803264617919925
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,32,1,power_law_1.01,0.4595135879516602
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,32,1,power_law_1.01,0.6133951950073242
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,32,1,power_law_1.01,3.895592346191406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,32,1,power_law_1.01,0.7325888061523438
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,6144,2560,8,160,32,1,power_law_1.2,0.059895682334899905
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,32,1,power_law_1.01,1.020202865600586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,6144,2560,8,160,32,1,power_law_1.2,0.07969855785369873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,6144,2560,8,160,32,1,power_law_1.2,0.0877023983001709
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,32,1,power_law_1.01,1.29427001953125
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,6144,2560,8,160,32,1,power_law_1.2,0.09865663528442384
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,6144,2560,8,160,32,1,power_law_1.2,0.11099136352539063
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,6144,2560,8,160,32,1,power_law_1.2,0.15291647911071776
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,6144,2560,8,160,32,1,power_law_1.2,0.16323968887329102
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,32,1,power_law_1.01,1.865301055908203
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,6144,2560,8,160,32,1,power_law_1.2,0.1724345588684082
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,6144,2560,8,160,32,1,power_law_1.2,0.18127744674682617
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,6144,2560,8,160,32,1,power_law_1.2,0.18807296752929686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,6144,2560,8,160,32,1,power_law_1.2,0.20030912399291992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,6144,2560,8,160,32,1,power_law_1.2,0.21270208358764647
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,6144,2560,8,160,32,1,power_law_1.2,0.22107839584350586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,6144,2560,8,160,32,1,power_law_1.2,0.22700223922729493
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,32,1,power_law_1.01,2.432139587402344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,6144,2560,8,160,32,1,power_law_1.2,0.23384447097778321
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,6144,2560,8,160,32,1,power_law_1.2,0.24204032897949218
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,6144,2560,8,160,32,1,power_law_1.2,0.25592128753662113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,6144,2560,8,160,32,1,power_law_1.2,0.28706687927246094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,6144,2560,8,160,32,1,power_law_1.2,0.32346305847167967
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,32,1,power_law_1.01,3.0005957031249997
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,6144,2560,8,160,32,1,power_law_1.2,0.42852928161621096
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,6144,2560,8,160,32,1,power_law_1.2,0.540577278137207
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,6144,2560,8,160,32,1,power_law_1.2,0.7204051208496094
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,6144,2560,8,160,32,1,power_law_1.2,0.8920511627197266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,6144,2560,8,160,32,1,power_law_1.2,0.05297855854034424
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,6144,2560,8,160,32,1,power_law_1.2,0.058860158920288085
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,6144,2560,8,160,32,1,power_law_1.2,0.06714367866516113
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,6144,2560,8,160,32,1,power_law_1.2,1.2611116790771484
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,6144,2560,8,160,32,1,power_law_1.2,0.08051775932312012
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,6144,2560,8,160,32,1,power_law_1.2,0.09867391586303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,6144,2560,8,160,32,1,power_law_1.2,1.6502764892578123
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,6144,2560,8,160,32,1,power_law_1.2,0.14080448150634767
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,6144,2560,8,160,32,1,power_law_1.2,0.17197952270507813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,6144,2560,8,160,32,1,power_law_1.2,0.15445952415466307
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,6144,2560,8,160,32,1,power_law_1.2,0.1798918342590332
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,6144,2560,8,160,32,1,power_law_1.2,0.18596223831176756
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,6144,2560,8,160,32,1,power_law_1.2,0.19108800888061522
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,6144,2560,8,160,32,1,power_law_1.2,0.1962681579589844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,6144,2560,8,160,32,1,power_law_1.2,2.401722869873047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,6144,2560,8,160,32,1,power_law_1.2,0.2468172836303711
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,6144,2560,8,160,32,1,power_law_1.2,0.2522918319702149
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,6144,2560,8,160,32,1,power_law_1.2,0.25930559158325195
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,6144,2560,8,160,32,1,power_law_1.2,0.26810623168945313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,6144,2560,8,160,32,1,power_law_1.2,0.2806707191467285
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,6144,2560,8,160,32,1,power_law_1.2,0.3076358413696289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,6144,2560,8,160,32,1,power_law_1.2,0.3380972671508789
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,6144,2560,8,160,32,1,power_law_1.2,3.1596218872070314
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,6144,2560,8,160,32,1,power_law_1.2,0.39739521026611324
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,6144,2560,8,160,32,1,power_law_1.2,0.46204353332519527
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,6144,2560,8,160,32,1,power_law_1.2,0.6200806427001953
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,6144,2560,8,160,32,1,power_law_1.2,3.9184634399414064
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,6144,2560,8,160,32,1,power_law_1.2,0.7403603363037109
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,6144,2560,8,160,32,1,power_law_1.2,1.028318099975586
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,6144,2560,8,160,32,1,power_law_1.2,1.306561279296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,32,1,power_law_1.01,0.09360704421997071
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,32,1,power_law_1.01,0.11954367637634278
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,32,1,power_law_1.01,0.12892864227294923
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,32,1,power_law_1.01,0.13400768280029296
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,6144,2560,8,160,32,1,power_law_1.2,1.874849853515625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,32,1,power_law_1.01,0.16731647491455076
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,32,1,power_law_1.01,0.1985286331176758
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,32,1,power_law_1.01,0.2195392036437988
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,32,1,power_law_1.01,0.2636479949951172
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,6144,2560,8,160,32,1,power_law_1.2,2.4403961181640623
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,32,1,power_law_1.01,0.27797119140625004
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,32,1,power_law_1.01,0.2878790473937988
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,32,1,power_law_1.01,0.30135808944702147
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,32,1,power_law_1.01,0.3144601631164551
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,6144,2560,8,160,32,1,power_law_1.2,3.0267367553710938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,32,1,power_law_1.01,0.3350924682617188
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,32,1,power_law_1.01,0.3528319931030274
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,32,1,power_law_1.01,0.3708121490478516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,32,1,power_law_1.01,0.39675647735595704
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,32,1,power_law_1.01,0.3710521697998047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,32,1,power_law_1.01,0.4227865600585938
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,32,1,power_law_1.01,0.4680326461791992
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,32,1,power_law_1.01,0.5850662231445313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,32,1,power_law_1.01,0.6802534484863282
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,32,1,power_law_1.01,0.887734375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,32,1,power_law_1.01,1.0189523315429687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,32,1,power_law_1.01,0.07502592086791993
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,32,1,power_law_1.01,1.399322814941406
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,32,1,power_law_1.01,0.08073856353759765
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,32,1,power_law_1.01,0.09733951568603516
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,32,1,power_law_1.01,1.7764288330078124
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,32,1,power_law_1.01,0.1062553596496582
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,32,1,power_law_1.01,0.15153344154357912
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,32,1,power_law_1.01,0.18984384536743165
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,32,1,power_law_1.01,0.21299200057983397
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,32,1,power_law_1.01,2.55836669921875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,32,1,power_law_1.01,0.2641670417785645
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,32,1,power_law_1.01,0.2769881629943848
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,32,1,power_law_1.01,0.28948928833007814
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,32,1,power_law_1.01,0.3075622367858887
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,32,1,power_law_1.01,3.3075033569335934
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,32,1,power_law_1.01,0.31663808822631834
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,32,1,power_law_1.01,0.33033985137939453
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,32,1,power_law_1.01,0.34439998626708984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,32,1,power_law_1.01,0.3552716827392578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,32,1,power_law_1.01,4.053648681640626
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,32,1,power_law_1.01,0.3636172866821289
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,32,1,power_law_1.01,0.4949798583984375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,32,1,power_law_1.01,0.523576316833496
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,32,1,power_law_1.01,0.5543692779541016
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,32,1,power_law_1.01,0.6307648086547852
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,32,1,power_law_1.01,0.7052787017822266
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,32,1,power_law_1.01,0.8769741058349609
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,32,1,power_law_1.01,1.0141273498535157
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1,7168,2048,8,384,32,1,power_law_1.2,0.09503552436828613
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,32,1,power_law_1.01,1.3378137207031249
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2,7168,2048,8,384,32,1,power_law_1.2,0.11824192047119139
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,32,1,power_law_1.01,1.6567333984375001
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4,7168,2048,8,384,32,1,power_law_1.2,0.1250111961364746
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8,7168,2048,8,384,32,1,power_law_1.2,0.1345299243927002
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16,7168,2048,8,384,32,1,power_law_1.2,0.1581120014190674
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,32,1,power_law_1.01,2.2992767333984374
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,32,7168,2048,8,384,32,1,power_law_1.2,0.1892620849609375
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,48,7168,2048,8,384,32,1,power_law_1.2,0.20694015502929686
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,64,7168,2048,8,384,32,1,power_law_1.2,0.25376960754394534
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,80,7168,2048,8,384,32,1,power_law_1.2,0.26620288848876955
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,96,7168,2048,8,384,32,1,power_law_1.2,0.2792588806152344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,32,1,power_law_1.01,2.9784805297851564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,128,7168,2048,8,384,32,1,power_law_1.2,0.2953727912902832
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,160,7168,2048,8,384,32,1,power_law_1.2,0.3175142478942871
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,192,7168,2048,8,384,32,1,power_law_1.2,0.3281894302368164
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,256,7168,2048,8,384,32,1,power_law_1.2,0.35406272888183593
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,32,1,power_law_1.01,3.6381170654296873
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,320,7168,2048,8,384,32,1,power_law_1.2,0.37407169342041013
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,384,7168,2048,8,384,32,1,power_law_1.2,0.4105184173583984
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,512,7168,2048,8,384,32,1,power_law_1.2,0.37703231811523436
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,768,7168,2048,8,384,32,1,power_law_1.2,0.4332537460327148
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1024,7168,2048,8,384,32,1,power_law_1.2,0.48447807312011715
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,1536,7168,2048,8,384,32,1,power_law_1.2,0.6054540634155273
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,2048,7168,2048,8,384,32,1,power_law_1.2,0.7161945343017578
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,3072,7168,2048,8,384,32,1,power_law_1.2,0.9134374237060546
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,4096,7168,2048,8,384,32,1,power_law_1.2,1.0454592132568359
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1,7168,2048,8,384,32,1,power_law_1.2,0.0751532793045044
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,6144,7168,2048,8,384,32,1,power_law_1.2,1.4292807006835937
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2,7168,2048,8,384,32,1,power_law_1.2,0.08111552238464356
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,8192,7168,2048,8,384,32,1,power_law_1.2,1.79586181640625
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4,7168,2048,8,384,32,1,power_law_1.2,0.09212863922119141
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8,7168,2048,8,384,32,1,power_law_1.2,0.10605695724487305
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16,7168,2048,8,384,32,1,power_law_1.2,0.13806143760681153
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,12288,7168,2048,8,384,32,1,power_law_1.2,2.5707852172851564
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,32,7168,2048,8,384,32,1,power_law_1.2,0.1761907196044922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,48,7168,2048,8,384,32,1,power_law_1.2,0.19799360275268554
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,64,7168,2048,8,384,32,1,power_law_1.2,0.2543168067932129
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,80,7168,2048,8,384,32,1,power_law_1.2,0.2669664001464844
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,96,7168,2048,8,384,32,1,power_law_1.2,0.27841087341308596
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,128,7168,2048,8,384,32,1,power_law_1.2,0.29449024200439455
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,16384,7168,2048,8,384,32,1,power_law_1.2,3.3357254028320313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,160,7168,2048,8,384,32,1,power_law_1.2,0.31137279510498045
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,192,7168,2048,8,384,32,1,power_law_1.2,0.3216185760498047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,256,7168,2048,8,384,32,1,power_law_1.2,0.3368627166748047
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,320,7168,2048,8,384,32,1,power_law_1.2,0.35300289154052733
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,384,7168,2048,8,384,32,1,power_law_1.2,0.36292095184326173
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,float16,20480,7168,2048,8,384,32,1,power_law_1.2,4.073712768554687
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,512,7168,2048,8,384,32,1,power_law_1.2,0.4934368133544922
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,768,7168,2048,8,384,32,1,power_law_1.2,0.5361324691772461
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1024,7168,2048,8,384,32,1,power_law_1.2,0.575736312866211
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,1536,7168,2048,8,384,32,1,power_law_1.2,0.6595654296875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,2048,7168,2048,8,384,32,1,power_law_1.2,0.7564268493652344
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,3072,7168,2048,8,384,32,1,power_law_1.2,0.9147590637207031
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,4096,7168,2048,8,384,32,1,power_law_1.2,1.0877235412597657
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,6144,7168,2048,8,384,32,1,power_law_1.2,1.4056179809570313
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,8192,7168,2048,8,384,32,1,power_law_1.2,1.726875457763672
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,12288,7168,2048,8,384,32,1,power_law_1.2,2.375732421875
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,16384,7168,2048,8,384,32,1,power_law_1.2,3.0376907348632813
SGLang,0.5.6.post2,NVIDIA H200,moe,sglang_fused_moe_triton,fp8_block,20480,7168,2048,8,384,32,1,power_law_1.2,3.685910339355469
