framework,version,device,op_name,kernel_source,moe_dtype,num_tokens,hidden_size,inter_size,topk,num_experts,moe_tp_size,moe_ep_size,distribution,latency
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,uniform,0.3651657147066934
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,uniform,0.35211885826928274
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,power_law_0.6,0.345071542263031
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,power_law_0.6,1.2833225182124546
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,power_law_0.8,0.3416658316339765
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.01,0.3467492571898869
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,power_law_0.8,1.1899318865367345
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.02,0.337226973261152
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,128,power_law_1.2,0.34651428631373815
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.01,1.0744365726198468
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,uniform,0.3461074275629861
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.02,1.028716802597046
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,power_law_0.6,0.3465892561844417
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32,7168,2048,8,256,1,2,power_law_1.2,0.9770980562482562
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,power_law_0.8,0.34252799919673377
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,uniform,0.35432685698781696
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.01,0.35063497253826686
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.02,0.34656822681427
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,power_law_0.6,1.6537124497549875
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,128,power_law_1.2,0.38265599949019297
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,power_law_0.8,1.573978512627738
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,uniform,0.3638902860028403
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.01,1.4925577129636491
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,power_law_0.6,0.3661833133016314
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,power_law_0.8,0.37554102880614143
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.02,1.4547364575522286
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.01,0.46660205721855164
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.02,0.479681829895292
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,uniform,0.3532571366855076
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,2,power_law_1.2,1.5416813680103847
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,uniform,0.3490560054779053
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,128,power_law_1.2,0.5642514262880598
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,power_law_0.6,0.9509906308991568
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,power_law_0.6,1.7335597719464984
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,power_law_0.8,0.8876242348126002
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.01,0.8322276592254638
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,power_law_0.8,1.6925037622451782
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.02,0.894721828188215
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,64,7168,2048,8,256,1,4,power_law_1.2,0.8536841137068613
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,uniform,0.4020205693585532
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.01,1.6306797742843628
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,uniform,0.3470262885093689
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,power_law_0.6,0.4836690264088767
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,power_law_0.6,0.9948041132518224
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.02,1.6133183990206037
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,power_law_0.8,0.9705362319946289
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,power_law_0.8,0.5260105158601488
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,uniform,0.35754056913512094
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,2,power_law_1.2,1.6696749755314417
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.01,0.9227785161563329
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,uniform,0.3591268616063254
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.01,0.7439844591276986
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,power_law_0.6,0.6050971490996224
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.02,0.9363291433879307
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,power_law_0.8,0.5793563417025975
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.02,0.7015186275754656
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,power_law_0.6,1.8428132499967302
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,4,power_law_1.2,0.9297243407794408
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.01,0.5692763430731637
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,uniform,0.34711314524923054
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.02,0.5726619396890913
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,128,power_law_1.2,0.9386697224208287
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,power_law_0.6,1.0349028655460903
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,power_law_0.8,1.7866413729531425
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,128,7168,2048,8,256,1,8,power_law_1.2,0.5336548566818238
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,uniform,0.3594194267477308
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,power_law_0.8,1.0120329073497227
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,power_law_0.6,0.6217581697872707
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,uniform,0.3575634275163923
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.01,1.7706404515675136
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.01,0.9504146286419459
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,power_law_0.8,0.6230674283845085
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,power_law_0.6,0.3451986287321363
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,power_law_0.8,0.3455204554966518
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.01,0.6001343948500497
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.02,0.9904822826385498
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,uniform,0.3545828546796526
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.02,1.7144676651273454
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.01,0.3482139425618308
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.02,0.5832182799066816
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,uniform,0.34850285734449116
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,uniform,0.36745142936706543
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,power_law_0.6,0.35393920115062166
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.02,0.34741028802735463
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,4,power_law_1.2,0.9869385191372463
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,8,power_law_1.2,0.6153389692306519
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,uniform,0.3549851434571402
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,power_law_0.6,0.34859154139246257
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,power_law_0.6,0.4246262865407126
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,64,power_law_1.2,0.3465225126062121
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,power_law_0.8,0.35307428581374034
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,2,power_law_1.2,1.7646683420453753
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,uniform,0.3678217189652579
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,power_law_0.8,0.3467154289994921
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,uniform,0.4428617145333971
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,power_law_0.8,0.4224347446646009
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,uniform,0.3526582803045
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,power_law_0.6,1.0589119911193847
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.01,0.3450761122362954
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.01,0.34225188493728637
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,power_law_0.6,0.642621260029929
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.01,0.41295542887278963
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,power_law_0.6,0.345524115221841
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.02,0.3498605719634465
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.02,0.3359277733734676
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.02,0.4010176011494228
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,power_law_0.8,0.6165467466626848
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,power_law_0.8,1.0324114305632455
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,power_law_0.8,0.34400000061307634
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,power_law_0.6,1.8756736074175153
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,32,power_law_1.2,0.3524946314947946
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,256,power_law_1.2,0.37089828508240835
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,256,7168,2048,8,256,1,16,power_law_1.2,0.40488137517656597
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,uniform,0.4969828597136906
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.01,0.5919387442725045
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.01,0.3426093714577811
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,uniform,0.3473691386835916
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,uniform,0.35774628605161396
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.01,1.0029961228370667
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.02,0.3469549707004002
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.02,0.5882660610335214
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,power_law_0.6,0.34910537259919305
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,power_law_0.6,0.42119040063449315
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,power_law_0.8,1.8530980518886022
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,64,power_law_1.2,0.3478153143610273
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,power_law_0.8,0.3416210285254887
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.02,1.019878395966121
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,power_law_0.8,0.41910857387951445
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,8,power_law_1.2,0.6169636522020613
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,power_law_0.6,0.76327588898795
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,uniform,0.36024228164127897
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.01,0.3478244585650308
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,uniform,0.3522377184459141
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.01,0.4277632006577083
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,uniform,0.3643611456666674
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,4,power_law_1.2,1.0379593099866595
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.02,0.34502400159835817
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,power_law_0.6,0.3585481149809701
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.02,0.42728411555290224
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.01,1.8150555474417551
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,power_law_0.6,0.6486290318625314
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,power_law_0.6,0.3488557721887316
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,uniform,0.44863542914390564
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,32,power_law_1.2,0.3498276582786015
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,power_law_0.8,0.9122194341250829
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,16,power_law_1.2,0.4197348586150578
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,power_law_0.8,0.3603181736809867
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,power_law_0.8,0.6367039969989232
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,power_law_0.8,0.3506587428706033
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,uniform,0.35873828189713614
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,uniform,0.364667432648795
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,power_law_0.6,1.0536466291972568
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.01,0.3775478856904166
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.02,1.75369234085083
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.01,0.6522176027297973
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.01,0.3946441148008619
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,power_law_0.6,0.34798445701599123
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,power_law_0.6,0.4385161135877882
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.02,0.4021997698715755
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,power_law_0.8,0.3539428583213261
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.02,0.6430921145847865
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.02,0.3791442275047302
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,power_law_0.8,0.43282651560647145
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,power_law_0.8,1.0400228466306414
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.01,1.1673115474837168
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.01,0.3766592008726937
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.01,0.4443035432270595
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,64,power_law_1.2,0.44172434295926777
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,256,power_law_1.2,0.5454400037016187
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,8,power_law_1.2,0.682863542011806
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,512,7168,2048,8,256,1,2,power_law_1.2,1.9335753100258963
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.02,0.3703469719205584
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.01,1.0915327991758075
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.02,0.43835062980651857
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,32,power_law_1.2,0.404625369821276
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,uniform,0.6800228442464556
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,uniform,0.449339428118297
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,16,power_law_1.2,0.4679698313985552
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.02,1.3719561168125698
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.02,1.0789942877633232
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,power_law_0.6,0.7162057178361075
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,uniform,0.3569142861025674
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,uniform,0.3754011392593384
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,uniform,0.3599817156791687
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,4,power_law_1.2,1.1495616095406669
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,power_law_0.6,0.47165714246886115
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,power_law_0.8,0.7101211445672172
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,power_law_0.6,1.9265115465436662
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,power_law_0.6,0.4071488005774362
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,power_law_0.6,0.4208073147705623
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,power_law_0.8,0.4835117723260607
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.01,0.7519487977027893
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,power_law_0.8,0.4325613737106323
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,uniform,0.6779794352395194
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,power_law_0.8,0.4498404588018145
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,uniform,0.39758171354021343
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.01,0.47995245371546064
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,128,power_law_1.2,2.348007334981646
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.01,0.47450788191386634
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.02,0.7428553155490331
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,power_law_0.8,1.892640917641776
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.01,0.5414500645228795
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.02,0.4876873161111559
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,power_law_0.6,1.1849563496453421
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,power_law_0.6,0.3966884570462363
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.02,0.47250925983701436
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,8,power_law_1.2,0.793082514830998
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,16,power_law_1.2,0.5065636609281813
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.02,0.5299227399485452
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,32,power_law_1.2,0.49624137026923043
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,power_law_0.8,0.4361846830163683
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,power_law_0.8,1.1802185160773142
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.01,1.9317540645599365
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,64,power_law_1.2,0.663191773210253
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,uniform,0.4588434270450047
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,uniform,0.6921920095171247
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.01,0.6038921134812492
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.01,1.2169572625841414
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,power_law_0.6,0.5620946288108826
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.02,1.9055076565061297
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,power_law_0.6,0.8522788575717382
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,uniform,0.39832685249192373
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.02,0.5939648049218315
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.02,1.2191012620925903
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,power_law_0.8,0.5843346323285784
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,power_law_0.8,0.8645202330180577
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,power_law_0.6,0.5287515435900006
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.01,0.6007067339760916
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,1024,7168,2048,8,256,1,2,power_law_1.2,2.1011547565460207
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,4,power_law_1.2,1.2804452555520194
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,256,power_law_1.2,0.9422976016998291
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,power_law_0.8,0.5464704002652849
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.01,0.9196351987974984
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.02,0.6405037709644863
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,uniform,0.41585828151021687
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,uniform,1.1452891486031669
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.01,0.6493732605661665
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,16,power_law_1.2,0.64637713602611
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.02,0.9147958874702453
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,power_law_0.6,0.575466057232448
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,uniform,1.1507748706000192
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.02,0.6501924565860203
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,8,power_law_1.2,1.0104795455932618
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,power_law_0.6,2.2045266151428224
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,power_law_0.8,0.6803190861429487
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,power_law_0.6,1.4124434300831386
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,32,power_law_1.2,0.7243410297802516
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,uniform,0.5585600052561078
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.01,0.8901193107877459
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,power_law_0.8,1.4031981774738858
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,power_law_0.8,2.1748297146388462
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,power_law_0.6,0.7634523425783429
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,uniform,0.8617280040468488
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.02,0.8624521170343672
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,power_law_0.8,0.7882047959736416
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.01,1.5174994264330184
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.01,2.1924196652003696
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,power_law_0.6,1.1433234316962106
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.01,0.8659739409174237
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,64,power_law_1.2,1.1033983979906354
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,uniform,0.4659337188516344
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.02,1.5708150795527867
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,uniform,0.5538651517459324
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.02,0.8996086869921003
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,power_law_0.8,1.1884699446814402
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.02,2.203762286049979
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,uniform,0.8676708596093314
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,power_law_0.6,0.5877366832324437
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,power_law_0.6,0.7802496007510594
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,4,power_law_1.2,1.5874514273234777
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,16,power_law_1.2,1.0569956524031503
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.01,1.2536703961236135
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,power_law_0.8,0.8225398847034999
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,2048,7168,2048,8,256,1,2,power_law_1.2,2.28885942867824
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,power_law_0.8,0.7208146282604763
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.02,1.266002287183489
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,power_law_0.6,1.375776903969901
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.01,0.9999881165368216
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.01,1.0892178314072745
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,8,power_law_1.2,1.4200100524084909
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,uniform,1.4601417098726546
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,uniform,2.096045766557966
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.02,0.987310630934579
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.02,1.0743862901415144
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,uniform,0.8268114328384399
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,power_law_0.6,1.926026964187622
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,power_law_0.8,1.649097146306719
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,32,power_law_1.2,1.714041600908552
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,uniform,0.6393142768314907
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,power_law_0.6,2.612576927457537
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,power_law_0.6,1.1319049154009138
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,power_law_0.8,2.0275419541767667
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,256,power_law_1.2,1.9832201174327306
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,power_law_0.6,1.0273993151528495
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,power_law_0.8,2.6164434160505023
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,power_law_0.8,1.2423305136816842
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,uniform,1.370125719479152
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.01,2.396929843085153
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.01,2.1873883519853865
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,power_law_0.8,1.1576210294451033
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.01,1.4583552019936699
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.01,2.7607488087245398
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,power_law_0.6,1.713060576575143
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.02,2.1766473191125053
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.02,1.3715492589133127
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.01,1.5274560008730207
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.02,2.7506130218505858
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.02,2.5373458453587125
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,power_law_0.8,1.8757174968719483
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,4,power_law_1.2,2.424609817777361
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,16,power_law_1.2,1.7277065208980016
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.02,1.7966372762407576
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,uniform,0.9021394337926593
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,4096,7168,2048,8,256,1,2,power_law_1.2,2.93711086000715
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.01,1.9942006826400758
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,power_law_0.6,1.3086893694741386
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,64,power_law_1.2,2.6903460570744104
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.02,2.3647890499659945
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,128,power_law_1.2,4.782516138894217
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,power_law_0.8,1.410474055153983
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,8,power_law_1.2,2.548207562310355
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,uniform,2.7155931336539134
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,uniform,2.482815980911255
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.01,1.8851465191159928
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,uniform,0.7212708592414856
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,power_law_0.6,3.590390879767282
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,uniform,1.44915657384055
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,power_law_0.6,3.289536912100656
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.02,2.2711433206285747
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,power_law_0.6,1.071712909426008
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,power_law_0.6,2.1264283657073975
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,power_law_0.8,3.7363163334982734
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,power_law_0.8,3.430124807357788
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,32,power_law_1.2,2.513818519456046
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,power_law_0.8,1.2952941690172468
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,power_law_0.8,2.291202756336757
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.01,4.029760932922363
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.01,3.6498852593558175
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.01,1.9371611424854824
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.01,2.658561795098441
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,uniform,2.5189668451036726
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,uniform,1.1257280111312866
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.02,3.8209380422319685
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.02,3.6663597651890347
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.02,2.6197074277060373
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.02,2.283673599788121
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,power_law_0.6,3.3311478751046315
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,power_law_0.6,1.8032895871571133
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,8192,7168,2048,8,256,1,2,power_law_1.2,4.260469961166382
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,4,power_law_1.2,4.077689572743007
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,16,power_law_1.2,3.7698550837380544
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,power_law_0.8,3.7333211626325333
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,power_law_0.8,2.146608451434544
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,256,power_law_1.2,4.297346728188651
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.01,4.474492338725499
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.01,2.824270636694772
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,uniform,1.640150853565761
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,uniform,4.90741947719029
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,uniform,1.596955418586731
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.02,4.347865601948329
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,power_law_0.6,2.5049536091940743
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.02,3.504882267543248
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,power_law_0.6,6.009877940586635
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,uniform,4.739757674080985
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,power_law_0.8,2.943776914051601
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,8,power_law_1.2,5.299573939187186
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,power_law_0.6,2.485481146403721
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,64,power_law_1.2,5.477546065194266
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,power_law_0.8,6.157601819719587
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,power_law_0.6,6.021046829223633
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.01,4.465353148324149
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,uniform,2.71936457497733
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,power_law_0.8,3.502069956915719
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.01,6.8739529200962615
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,power_law_0.8,6.076145403725761
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.02,4.297021266392299
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,power_law_0.6,4.0199158668518065
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,power_law_1.01,4.3309074401855465
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.02,6.6842633247375485
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.01,6.831331648145404
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,power_law_0.8,4.246268340519497
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,32,power_law_1.2,6.184219401223319
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,uniform,1.318244559424264
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,16384,7168,2048,8,256,1,2,power_law_1.2,6.756818321772984
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,power_law_1.02,4.867244815826416
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.01,5.72520136151995
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.02,7.382743753705706
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,power_law_0.6,2.015811661311558
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,uniform,4.9244891575404575
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.02,5.257658508845738
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,4,power_law_1.2,7.0989311490740095
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,power_law_0.8,2.515466962541853
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,power_law_0.6,6.185824925558908
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,128,power_law_1.2,10.623944228036063
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,uniform,2.10464004107884
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,16,power_law_1.2,7.371071066175189
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,power_law_1.01,4.42494261605399
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,power_law_0.8,7.654831572941371
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,power_law_0.6,3.498203434262957
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,uniform,9.816073145185198
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,power_law_1.02,4.76806218964713
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.01,8.767742102486746
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,power_law_0.8,4.072296217509678
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,power_law_0.6,11.383588572910854
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,uniform,3.1587702887398854
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.02,8.525165707724435
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,256,power_law_1.2,10.09958951132638
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,power_law_1.01,6.274154949188232
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,uniform,9.531711850847516
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,power_law_0.8,11.506112916128975
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,power_law_0.6,5.273756326947893
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,power_law_1.02,7.253268051147461
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,8,power_law_1.2,11.08435205732073
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,power_law_0.8,5.96470308303833
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,power_law_0.6,11.401450974600655
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.01,11.711802428109305
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,uniform,5.3504365512302945
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,64,power_law_1.2,11.634291185651506
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,power_law_1.01,7.333714321681431
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.02,12.10576365334647
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,power_law_0.8,12.350742885044642
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,power_law_0.6,7.898940345219203
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,power_law_1.02,9.185373251778739
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,32768,7168,2048,8,256,1,2,power_law_1.2,11.792597034999302
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.01,13.803361810956682
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,uniform,3.0448868615286693
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,power_law_0.8,8.863552066258022
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.02,12.74002742767334
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,32,power_law_1.2,14.784687505449568
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,power_law_0.6,5.0121142932346885
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,power_law_1.01,10.791701970781599
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,uniform,10.0817505972726
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,65536,7168,2048,8,256,1,4,power_law_1.2,15.47077478681292
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,power_law_0.8,6.524989237104143
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,uniform,2.4982353959764754
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,power_law_1.02,12.673493930271693
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,power_law_0.6,13.458110182625907
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,power_law_0.6,3.825354051589966
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,power_law_1.01,9.291160774230956
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,16,power_law_1.2,15.894074494498117
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,power_law_0.8,4.741431767599924
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,power_law_0.8,14.853506878444128
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,uniform,4.06012351172311
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,power_law_1.02,12.634580993652344
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,power_law_1.01,8.592652743203299
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,power_law_0.6,6.653462818690708
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,power_law_1.01,17.365272603716168
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,power_law_1.02,9.07168824332101
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,power_law_0.8,9.297799382890974
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,128,power_law_1.2,19.731861931937082
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,power_law_1.02,17.038376344953264
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,uniform,6.320160048348563
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,power_law_1.01,11.221198545183455
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,power_law_0.6,9.90594926561628
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,131072,7168,2048,8,256,1,8,power_law_1.2,21.484181104387556
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,256,power_law_1.2,26.596666554042272
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,power_law_1.02,14.458337838309152
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,power_law_0.8,13.869070598057338
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,uniform,10.93555177961077
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,power_law_1.01,17.554276602608816
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,64,power_law_1.2,29.42575732639858
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,power_law_0.6,16.54874518258231
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,power_law_1.02,17.02618239266532
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,power_law_0.8,19.58311860220773
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,32,power_law_1.2,33.87959382193429
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,power_law_1.01,24.248941802978514
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,uniform,5.926304067884173
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,power_law_1.02,22.585743604387556
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,power_law_0.6,10.687732151576451
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,uniform,4.858422892434256
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,262144,7168,2048,8,256,1,16,power_law_1.2,31.211369105747767
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,power_law_0.6,7.53961147580828
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,power_law_0.8,14.631129619053432
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,uniform,8.005051408495222
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,power_law_0.8,9.916405023847307
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,power_law_1.01,21.315267617361886
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,power_law_0.6,14.648745155334472
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,power_law_1.01,23.566278403145926
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,power_law_1.02,21.67429847717285
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,power_law_0.8,19.186664363316126
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,uniform,12.559721265520368
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,power_law_1.02,23.386864362444197
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,power_law_0.6,20.436404037475587
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,power_law_1.01,28.658064542497907
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,128,power_law_1.2,55.133244323730466
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,256,power_law_1.2,49.567279543195454
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,power_law_0.8,25.04123524257115
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,power_law_1.02,30.859188897269114
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,power_law_1.01,30.4286071232387
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,64,power_law_1.2,60.052931213378905
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,power_law_1.02,37.18844958714077
SGLang,0.5.6.post2,NVIDIA H200,moe_context,deepepmoe,fp8_block,524288,7168,2048,8,256,1,32,power_law_1.2,61.63085370744977
